From c5866aa5d027d1b7a0f8d14499a9ebaab8433e02 Mon Sep 17 00:00:00 2001 From: Void Date: Wed, 20 Oct 2021 09:46:14 -0400 Subject: [PATCH 01/15] bump up cutlass upstream to 2.7 --- cutlass | 2 +- 1 file changed, 1 insertion(+), 1 deletion(-) diff --git a/cutlass b/cutlass index c2b80ad..2e07c4c 160000 --- a/cutlass +++ b/cutlass @@ -1 +1 @@ -Subproject commit c2b80ad4e4f8b60a65500bd04c8fecddff2ba355 +Subproject commit 2e07c4cc2fc94f4cd396ecf1e9132caf1efba50e From 6df6200a12208edc6a816cf0e71eaba450c88af5 Mon Sep 17 00:00:00 2001 From: Void Date: Sat, 23 Oct 2021 07:55:42 -0400 Subject: [PATCH 02/15] fixes for build against cutlass 2.7 version bump --- examples/00_minplus_srgemm/CMakeLists.txt | 1 + include/cuasr/reduction/kernel/reduce_split_k.h | 4 ++-- test/regress/CMakeLists.txt | 1 + 3 files changed, 4 insertions(+), 2 deletions(-) diff --git a/examples/00_minplus_srgemm/CMakeLists.txt b/examples/00_minplus_srgemm/CMakeLists.txt index 3ea6fe6..2677001 100644 --- a/examples/00_minplus_srgemm/CMakeLists.txt +++ b/examples/00_minplus_srgemm/CMakeLists.txt @@ -5,6 +5,7 @@ target_include_directories(minplus_srgemm PRIVATE ${PROJECT_SOURCE_DIR}/include ${PROJECT_SOURCE_DIR}/cutlass/include + ${PROJECT_SOURCE_DIR}/cutlass/tools/util/include ${CUDA_INCLUDE_DIRS} ) target_compile_options(minplus_srgemm diff --git a/include/cuasr/reduction/kernel/reduce_split_k.h b/include/cuasr/reduction/kernel/reduce_split_k.h index 83397ef..d7108f5 100644 --- a/include/cuasr/reduction/kernel/reduce_split_k.h +++ b/include/cuasr/reduction/kernel/reduce_split_k.h @@ -147,8 +147,8 @@ class ReduceSplitK { // Determine CTA position cutlass::MatrixCoord thread_offset( - int(blockIdx.x) * Shape::kRow + threadIdx.y, - int(blockIdx.y) * Shape::kColumn + threadIdx.x * kElementsPerAccess + cutlass::MatrixCoord::Index(int(blockIdx.x) * Shape::kRow + threadIdx.y), + cutlass::MatrixCoord::Index(int(blockIdx.y) * Shape::kColumn + threadIdx.x * kElementsPerAccess) ); // One guard conditional diff --git 
a/test/regress/CMakeLists.txt b/test/regress/CMakeLists.txt index ff04a4f..108d047 100644 --- a/test/regress/CMakeLists.txt +++ b/test/regress/CMakeLists.txt @@ -6,6 +6,7 @@ add_library(deprecated_libfwgpu ${cuASR_LIB_TYPE} target_include_directories(deprecated_libfwgpu PUBLIC ${PROJECT_SOURCE_DIR}/include ${CUDA_INCLUDE_DIRS} PRIVATE ${PROJECT_SOURCE_DIR}/cutlass/include + PRIVATE ${PROJECT_SOURCE_DIR}/cutlass/tools/util/include PRIVATE ${PROJECT_SOURCE_DIR}/test/regress/include ) target_compile_options(deprecated_libfwgpu From e968316dd13c1a6d26a3e666c57640479795ae51 Mon Sep 17 00:00:00 2001 From: Void Date: Sat, 23 Oct 2021 08:00:59 -0400 Subject: [PATCH 03/15] nits --- README.md | 2 +- .../cuasr/gemm/threadblock/srmma_pipelined.h | 17 ++++++----------- 2 files changed, 7 insertions(+), 12 deletions(-) diff --git a/README.md b/README.md index 96235ca..0fcd465 100644 --- a/README.md +++ b/README.md @@ -21,7 +21,7 @@ Normally, BLAS libraries are defined as operations over real numbers,`+` and `x` cuASR is a template library and therefore header only, but includes an exhaustive list of tests and benchmarks. The build system is based on `CMake`. Basic checkout and build instructions are as follows: ```sh -$ git clone --recurse-submodules https://github.com/hpcgarage/semiring-gemm /path/to/repo +$ git clone --recurse-submodules https://github.com/hpcgarage/cuASR /path/to/repo $ cd /path/to/repo $ mkdir build && cd build $ cmake .. 
-G Ninja -DCUASR_CUDA_ARCHS="70 75" diff --git a/include/cuasr/gemm/threadblock/srmma_pipelined.h b/include/cuasr/gemm/threadblock/srmma_pipelined.h index 49ca9c1..c4ba4e1 100644 --- a/include/cuasr/gemm/threadblock/srmma_pipelined.h +++ b/include/cuasr/gemm/threadblock/srmma_pipelined.h @@ -53,8 +53,7 @@ template < typename SmemIteratorA_::Element, typename IteratorA_::Element, IteratorA_::Fragment::kElements>, - /// - /// Transformation applied to A operand + /// Transformation applied to B operand typename TransformB_ = cutlass::NumericArrayConverter< typename SmemIteratorB_::Element, typename IteratorB_::Element, @@ -124,7 +123,7 @@ class SrmmaPipelined : public cutlass::gemm::threadblock::MmaBase Date: Thu, 28 Oct 2021 14:45:47 -0400 Subject: [PATCH 04/15] set and require C++14 for CUDA --- CMakeLists.txt | 5 +++++ 1 file changed, 5 insertions(+) diff --git a/CMakeLists.txt b/CMakeLists.txt index 6a40f42..ae527f2 100644 --- a/CMakeLists.txt +++ b/CMakeLists.txt @@ -29,6 +29,11 @@ option(CUASR_CUDA_ARCHS "List of CUDA architectures to compile for." 
"60 61 70 7 find_package(CUDA REQUIRED) set(CMAKE_CXX_EXTENSIONS OFF) set(CMAKE_CXX_STANDARD 14) +set(CMAKE_CXX_STANDARD_REQUIRED ON) +set(CMAKE_CXX_EXTENSIONS OFF) + +set(CMAKE_CUDA_STANDARD 14) +set(CMAKE_CUDA_STANDARD_REQUIRED TRUE) # C++ compiler flags for target compile options set(cuASR_CXX_FLAGS -Wall -Wextra -Wno-unused-parameter -Wno-uninitialized -Wno-strict-aliasing) From 55b372c5c7ec0a6863f05b6778a0234f69b9d0c7 Mon Sep 17 00:00:00 2001 From: Void Date: Sat, 30 Oct 2021 15:11:36 -0400 Subject: [PATCH 05/15] generalize test generator and rename test files in prep for SM80 --- test/device/{simt_sm50.py => gen_simt.py} | 31 +++++++++++++------ ...simt_binary_or_binary_and_dsrgemm_nn_n.cu} | 0 ...simt_binary_or_binary_and_dsrgemm_nn_t.cu} | 0 ...simt_binary_or_binary_and_dsrgemm_nt_n.cu} | 0 ...simt_binary_or_binary_and_dsrgemm_nt_t.cu} | 0 ...simt_binary_or_binary_and_dsrgemm_tn_n.cu} | 0 ...simt_binary_or_binary_and_dsrgemm_tn_t.cu} | 0 ...simt_binary_or_binary_and_dsrgemm_tt_n.cu} | 0 ...simt_binary_or_binary_and_dsrgemm_tt_t.cu} | 0 ...simt_binary_or_binary_and_ssrgemm_nn_n.cu} | 0 ...simt_binary_or_binary_and_ssrgemm_nn_t.cu} | 0 ...simt_binary_or_binary_and_ssrgemm_nt_n.cu} | 0 ...simt_binary_or_binary_and_ssrgemm_nt_t.cu} | 0 ...simt_binary_or_binary_and_ssrgemm_tn_n.cu} | 0 ...simt_binary_or_binary_and_ssrgemm_tn_t.cu} | 0 ...simt_binary_or_binary_and_ssrgemm_tt_n.cu} | 0 ...simt_binary_or_binary_and_ssrgemm_tt_t.cu} | 0 ...sm50_simt_maximum_minimum_dsrgemm_nn_n.cu} | 0 ...sm50_simt_maximum_minimum_dsrgemm_nn_t.cu} | 0 ...sm50_simt_maximum_minimum_dsrgemm_nt_n.cu} | 0 ...sm50_simt_maximum_minimum_dsrgemm_nt_t.cu} | 0 ...sm50_simt_maximum_minimum_dsrgemm_tn_n.cu} | 0 ...sm50_simt_maximum_minimum_dsrgemm_tn_t.cu} | 0 ...sm50_simt_maximum_minimum_dsrgemm_tt_n.cu} | 0 ...sm50_simt_maximum_minimum_dsrgemm_tt_t.cu} | 0 ...sm50_simt_maximum_minimum_ssrgemm_nn_n.cu} | 0 ...sm50_simt_maximum_minimum_ssrgemm_nn_t.cu} | 0 
...sm50_simt_maximum_minimum_ssrgemm_nt_n.cu} | 0 ...sm50_simt_maximum_minimum_ssrgemm_nt_t.cu} | 0 ...sm50_simt_maximum_minimum_ssrgemm_tn_n.cu} | 0 ...sm50_simt_maximum_minimum_ssrgemm_tn_t.cu} | 0 ...sm50_simt_maximum_minimum_ssrgemm_tt_n.cu} | 0 ...sm50_simt_maximum_minimum_ssrgemm_tt_t.cu} | 0 ...0_simt_maximum_multiplies_dsrgemm_nn_n.cu} | 0 ...0_simt_maximum_multiplies_dsrgemm_nn_t.cu} | 0 ...0_simt_maximum_multiplies_dsrgemm_nt_n.cu} | 0 ...0_simt_maximum_multiplies_dsrgemm_nt_t.cu} | 0 ...0_simt_maximum_multiplies_dsrgemm_tn_n.cu} | 0 ...0_simt_maximum_multiplies_dsrgemm_tn_t.cu} | 0 ...0_simt_maximum_multiplies_dsrgemm_tt_n.cu} | 0 ...0_simt_maximum_multiplies_dsrgemm_tt_t.cu} | 0 ...0_simt_maximum_multiplies_ssrgemm_nn_n.cu} | 0 ...0_simt_maximum_multiplies_ssrgemm_nn_t.cu} | 0 ...0_simt_maximum_multiplies_ssrgemm_nt_n.cu} | 0 ...0_simt_maximum_multiplies_ssrgemm_nt_t.cu} | 0 ...0_simt_maximum_multiplies_ssrgemm_tn_n.cu} | 0 ...0_simt_maximum_multiplies_ssrgemm_tn_t.cu} | 0 ...0_simt_maximum_multiplies_ssrgemm_tt_n.cu} | 0 ...0_simt_maximum_multiplies_ssrgemm_tt_t.cu} | 0 ...=> sm50_simt_maximum_plus_dsrgemm_nn_n.cu} | 0 ...=> sm50_simt_maximum_plus_dsrgemm_nn_t.cu} | 0 ...=> sm50_simt_maximum_plus_dsrgemm_nt_n.cu} | 0 ...=> sm50_simt_maximum_plus_dsrgemm_nt_t.cu} | 0 ...=> sm50_simt_maximum_plus_dsrgemm_tn_n.cu} | 0 ...=> sm50_simt_maximum_plus_dsrgemm_tn_t.cu} | 0 ...=> sm50_simt_maximum_plus_dsrgemm_tt_n.cu} | 0 ...=> sm50_simt_maximum_plus_dsrgemm_tt_t.cu} | 0 ...=> sm50_simt_maximum_plus_ssrgemm_nn_n.cu} | 0 ...=> sm50_simt_maximum_plus_ssrgemm_nn_t.cu} | 0 ...=> sm50_simt_maximum_plus_ssrgemm_nt_n.cu} | 0 ...=> sm50_simt_maximum_plus_ssrgemm_nt_t.cu} | 0 ...=> sm50_simt_maximum_plus_ssrgemm_tn_n.cu} | 0 ...=> sm50_simt_maximum_plus_ssrgemm_tn_t.cu} | 0 ...=> sm50_simt_maximum_plus_ssrgemm_tt_n.cu} | 0 ...=> sm50_simt_maximum_plus_ssrgemm_tt_t.cu} | 0 ...sm50_simt_minimum_maximum_dsrgemm_nn_n.cu} | 0 ...sm50_simt_minimum_maximum_dsrgemm_nn_t.cu} | 0 
...sm50_simt_minimum_maximum_dsrgemm_nt_n.cu} | 0 ...sm50_simt_minimum_maximum_dsrgemm_nt_t.cu} | 0 ...sm50_simt_minimum_maximum_dsrgemm_tn_n.cu} | 0 ...sm50_simt_minimum_maximum_dsrgemm_tn_t.cu} | 0 ...sm50_simt_minimum_maximum_dsrgemm_tt_n.cu} | 0 ...sm50_simt_minimum_maximum_dsrgemm_tt_t.cu} | 0 ...sm50_simt_minimum_maximum_ssrgemm_nn_n.cu} | 0 ...sm50_simt_minimum_maximum_ssrgemm_nn_t.cu} | 0 ...sm50_simt_minimum_maximum_ssrgemm_nt_n.cu} | 0 ...sm50_simt_minimum_maximum_ssrgemm_nt_t.cu} | 0 ...sm50_simt_minimum_maximum_ssrgemm_tn_n.cu} | 0 ...sm50_simt_minimum_maximum_ssrgemm_tn_t.cu} | 0 ...sm50_simt_minimum_maximum_ssrgemm_tt_n.cu} | 0 ...sm50_simt_minimum_maximum_ssrgemm_tt_t.cu} | 0 ...0_simt_minimum_multiplies_dsrgemm_nn_n.cu} | 0 ...0_simt_minimum_multiplies_dsrgemm_nn_t.cu} | 0 ...0_simt_minimum_multiplies_dsrgemm_nt_n.cu} | 0 ...0_simt_minimum_multiplies_dsrgemm_nt_t.cu} | 0 ...0_simt_minimum_multiplies_dsrgemm_tn_n.cu} | 0 ...0_simt_minimum_multiplies_dsrgemm_tn_t.cu} | 0 ...0_simt_minimum_multiplies_dsrgemm_tt_n.cu} | 0 ...0_simt_minimum_multiplies_dsrgemm_tt_t.cu} | 0 ...0_simt_minimum_multiplies_ssrgemm_nn_n.cu} | 0 ...0_simt_minimum_multiplies_ssrgemm_nn_t.cu} | 0 ...0_simt_minimum_multiplies_ssrgemm_nt_n.cu} | 0 ...0_simt_minimum_multiplies_ssrgemm_nt_t.cu} | 0 ...0_simt_minimum_multiplies_ssrgemm_tn_n.cu} | 0 ...0_simt_minimum_multiplies_ssrgemm_tn_t.cu} | 0 ...0_simt_minimum_multiplies_ssrgemm_tt_n.cu} | 0 ...0_simt_minimum_multiplies_ssrgemm_tt_t.cu} | 0 ...=> sm50_simt_minimum_plus_dsrgemm_nn_n.cu} | 0 ...=> sm50_simt_minimum_plus_dsrgemm_nn_t.cu} | 0 ...=> sm50_simt_minimum_plus_dsrgemm_nt_n.cu} | 0 ...=> sm50_simt_minimum_plus_dsrgemm_nt_t.cu} | 0 ...=> sm50_simt_minimum_plus_dsrgemm_tn_n.cu} | 0 ...=> sm50_simt_minimum_plus_dsrgemm_tn_t.cu} | 0 ...=> sm50_simt_minimum_plus_dsrgemm_tt_n.cu} | 0 ...=> sm50_simt_minimum_plus_dsrgemm_tt_t.cu} | 0 ...=> sm50_simt_minimum_plus_ssrgemm_nn_n.cu} | 0 ...=> sm50_simt_minimum_plus_ssrgemm_nn_t.cu} | 0 
...=> sm50_simt_minimum_plus_ssrgemm_nt_n.cu} | 0 ...=> sm50_simt_minimum_plus_ssrgemm_nt_t.cu} | 0 ...=> sm50_simt_minimum_plus_ssrgemm_tn_n.cu} | 0 ...=> sm50_simt_minimum_plus_ssrgemm_tn_t.cu} | 0 ...=> sm50_simt_minimum_plus_ssrgemm_tt_n.cu} | 0 ...=> sm50_simt_minimum_plus_ssrgemm_tt_t.cu} | 0 ...sm50_simt_plus_multiplies_dsrgemm_nn_n.cu} | 0 ...sm50_simt_plus_multiplies_dsrgemm_nn_t.cu} | 0 ...sm50_simt_plus_multiplies_dsrgemm_nt_n.cu} | 0 ...sm50_simt_plus_multiplies_dsrgemm_nt_t.cu} | 0 ...sm50_simt_plus_multiplies_dsrgemm_tn_n.cu} | 0 ...sm50_simt_plus_multiplies_dsrgemm_tn_t.cu} | 0 ...sm50_simt_plus_multiplies_dsrgemm_tt_n.cu} | 0 ...sm50_simt_plus_multiplies_dsrgemm_tt_t.cu} | 0 ...sm50_simt_plus_multiplies_ssrgemm_nn_n.cu} | 0 ...sm50_simt_plus_multiplies_ssrgemm_nn_t.cu} | 0 ...sm50_simt_plus_multiplies_ssrgemm_nt_n.cu} | 0 ...sm50_simt_plus_multiplies_ssrgemm_nt_t.cu} | 0 ...sm50_simt_plus_multiplies_ssrgemm_tn_n.cu} | 0 ...sm50_simt_plus_multiplies_ssrgemm_tn_t.cu} | 0 ...sm50_simt_plus_multiplies_ssrgemm_tt_n.cu} | 0 ...sm50_simt_plus_multiplies_ssrgemm_tt_t.cu} | 0 129 files changed, 21 insertions(+), 10 deletions(-) rename test/device/{simt_sm50.py => gen_simt.py} (93%) rename test/device/{simt_binary_or_binary_and_dsrgemm_nn_n_sm50.cu => sm50_simt_binary_or_binary_and_dsrgemm_nn_n.cu} (100%) rename test/device/{simt_binary_or_binary_and_dsrgemm_nn_t_sm50.cu => sm50_simt_binary_or_binary_and_dsrgemm_nn_t.cu} (100%) rename test/device/{simt_binary_or_binary_and_dsrgemm_nt_n_sm50.cu => sm50_simt_binary_or_binary_and_dsrgemm_nt_n.cu} (100%) rename test/device/{simt_binary_or_binary_and_dsrgemm_nt_t_sm50.cu => sm50_simt_binary_or_binary_and_dsrgemm_nt_t.cu} (100%) rename test/device/{simt_binary_or_binary_and_dsrgemm_tn_n_sm50.cu => sm50_simt_binary_or_binary_and_dsrgemm_tn_n.cu} (100%) rename test/device/{simt_binary_or_binary_and_dsrgemm_tn_t_sm50.cu => sm50_simt_binary_or_binary_and_dsrgemm_tn_t.cu} (100%) rename 
test/device/{simt_binary_or_binary_and_dsrgemm_tt_n_sm50.cu => sm50_simt_binary_or_binary_and_dsrgemm_tt_n.cu} (100%) rename test/device/{simt_binary_or_binary_and_dsrgemm_tt_t_sm50.cu => sm50_simt_binary_or_binary_and_dsrgemm_tt_t.cu} (100%) rename test/device/{simt_binary_or_binary_and_ssrgemm_nn_n_sm50.cu => sm50_simt_binary_or_binary_and_ssrgemm_nn_n.cu} (100%) rename test/device/{simt_binary_or_binary_and_ssrgemm_nn_t_sm50.cu => sm50_simt_binary_or_binary_and_ssrgemm_nn_t.cu} (100%) rename test/device/{simt_binary_or_binary_and_ssrgemm_nt_n_sm50.cu => sm50_simt_binary_or_binary_and_ssrgemm_nt_n.cu} (100%) rename test/device/{simt_binary_or_binary_and_ssrgemm_nt_t_sm50.cu => sm50_simt_binary_or_binary_and_ssrgemm_nt_t.cu} (100%) rename test/device/{simt_binary_or_binary_and_ssrgemm_tn_n_sm50.cu => sm50_simt_binary_or_binary_and_ssrgemm_tn_n.cu} (100%) rename test/device/{simt_binary_or_binary_and_ssrgemm_tn_t_sm50.cu => sm50_simt_binary_or_binary_and_ssrgemm_tn_t.cu} (100%) rename test/device/{simt_binary_or_binary_and_ssrgemm_tt_n_sm50.cu => sm50_simt_binary_or_binary_and_ssrgemm_tt_n.cu} (100%) rename test/device/{simt_binary_or_binary_and_ssrgemm_tt_t_sm50.cu => sm50_simt_binary_or_binary_and_ssrgemm_tt_t.cu} (100%) rename test/device/{simt_maximum_minimum_dsrgemm_nn_n_sm50.cu => sm50_simt_maximum_minimum_dsrgemm_nn_n.cu} (100%) rename test/device/{simt_maximum_minimum_dsrgemm_nn_t_sm50.cu => sm50_simt_maximum_minimum_dsrgemm_nn_t.cu} (100%) rename test/device/{simt_maximum_minimum_dsrgemm_nt_n_sm50.cu => sm50_simt_maximum_minimum_dsrgemm_nt_n.cu} (100%) rename test/device/{simt_maximum_minimum_dsrgemm_nt_t_sm50.cu => sm50_simt_maximum_minimum_dsrgemm_nt_t.cu} (100%) rename test/device/{simt_maximum_minimum_dsrgemm_tn_n_sm50.cu => sm50_simt_maximum_minimum_dsrgemm_tn_n.cu} (100%) rename test/device/{simt_maximum_minimum_dsrgemm_tn_t_sm50.cu => sm50_simt_maximum_minimum_dsrgemm_tn_t.cu} (100%) rename test/device/{simt_maximum_minimum_dsrgemm_tt_n_sm50.cu => 
sm50_simt_maximum_minimum_dsrgemm_tt_n.cu} (100%) rename test/device/{simt_maximum_minimum_dsrgemm_tt_t_sm50.cu => sm50_simt_maximum_minimum_dsrgemm_tt_t.cu} (100%) rename test/device/{simt_maximum_minimum_ssrgemm_nn_n_sm50.cu => sm50_simt_maximum_minimum_ssrgemm_nn_n.cu} (100%) rename test/device/{simt_maximum_minimum_ssrgemm_nn_t_sm50.cu => sm50_simt_maximum_minimum_ssrgemm_nn_t.cu} (100%) rename test/device/{simt_maximum_minimum_ssrgemm_nt_n_sm50.cu => sm50_simt_maximum_minimum_ssrgemm_nt_n.cu} (100%) rename test/device/{simt_maximum_minimum_ssrgemm_nt_t_sm50.cu => sm50_simt_maximum_minimum_ssrgemm_nt_t.cu} (100%) rename test/device/{simt_maximum_minimum_ssrgemm_tn_n_sm50.cu => sm50_simt_maximum_minimum_ssrgemm_tn_n.cu} (100%) rename test/device/{simt_maximum_minimum_ssrgemm_tn_t_sm50.cu => sm50_simt_maximum_minimum_ssrgemm_tn_t.cu} (100%) rename test/device/{simt_maximum_minimum_ssrgemm_tt_n_sm50.cu => sm50_simt_maximum_minimum_ssrgemm_tt_n.cu} (100%) rename test/device/{simt_maximum_minimum_ssrgemm_tt_t_sm50.cu => sm50_simt_maximum_minimum_ssrgemm_tt_t.cu} (100%) rename test/device/{simt_maximum_multiplies_dsrgemm_nn_n_sm50.cu => sm50_simt_maximum_multiplies_dsrgemm_nn_n.cu} (100%) rename test/device/{simt_maximum_multiplies_dsrgemm_nn_t_sm50.cu => sm50_simt_maximum_multiplies_dsrgemm_nn_t.cu} (100%) rename test/device/{simt_maximum_multiplies_dsrgemm_nt_n_sm50.cu => sm50_simt_maximum_multiplies_dsrgemm_nt_n.cu} (100%) rename test/device/{simt_maximum_multiplies_dsrgemm_nt_t_sm50.cu => sm50_simt_maximum_multiplies_dsrgemm_nt_t.cu} (100%) rename test/device/{simt_maximum_multiplies_dsrgemm_tn_n_sm50.cu => sm50_simt_maximum_multiplies_dsrgemm_tn_n.cu} (100%) rename test/device/{simt_maximum_multiplies_dsrgemm_tn_t_sm50.cu => sm50_simt_maximum_multiplies_dsrgemm_tn_t.cu} (100%) rename test/device/{simt_maximum_multiplies_dsrgemm_tt_n_sm50.cu => sm50_simt_maximum_multiplies_dsrgemm_tt_n.cu} (100%) rename test/device/{simt_maximum_multiplies_dsrgemm_tt_t_sm50.cu => 
sm50_simt_maximum_multiplies_dsrgemm_tt_t.cu} (100%) rename test/device/{simt_maximum_multiplies_ssrgemm_nn_n_sm50.cu => sm50_simt_maximum_multiplies_ssrgemm_nn_n.cu} (100%) rename test/device/{simt_maximum_multiplies_ssrgemm_nn_t_sm50.cu => sm50_simt_maximum_multiplies_ssrgemm_nn_t.cu} (100%) rename test/device/{simt_maximum_multiplies_ssrgemm_nt_n_sm50.cu => sm50_simt_maximum_multiplies_ssrgemm_nt_n.cu} (100%) rename test/device/{simt_maximum_multiplies_ssrgemm_nt_t_sm50.cu => sm50_simt_maximum_multiplies_ssrgemm_nt_t.cu} (100%) rename test/device/{simt_maximum_multiplies_ssrgemm_tn_n_sm50.cu => sm50_simt_maximum_multiplies_ssrgemm_tn_n.cu} (100%) rename test/device/{simt_maximum_multiplies_ssrgemm_tn_t_sm50.cu => sm50_simt_maximum_multiplies_ssrgemm_tn_t.cu} (100%) rename test/device/{simt_maximum_multiplies_ssrgemm_tt_n_sm50.cu => sm50_simt_maximum_multiplies_ssrgemm_tt_n.cu} (100%) rename test/device/{simt_maximum_multiplies_ssrgemm_tt_t_sm50.cu => sm50_simt_maximum_multiplies_ssrgemm_tt_t.cu} (100%) rename test/device/{simt_maximum_plus_dsrgemm_nn_n_sm50.cu => sm50_simt_maximum_plus_dsrgemm_nn_n.cu} (100%) rename test/device/{simt_maximum_plus_dsrgemm_nn_t_sm50.cu => sm50_simt_maximum_plus_dsrgemm_nn_t.cu} (100%) rename test/device/{simt_maximum_plus_dsrgemm_nt_n_sm50.cu => sm50_simt_maximum_plus_dsrgemm_nt_n.cu} (100%) rename test/device/{simt_maximum_plus_dsrgemm_nt_t_sm50.cu => sm50_simt_maximum_plus_dsrgemm_nt_t.cu} (100%) rename test/device/{simt_maximum_plus_dsrgemm_tn_n_sm50.cu => sm50_simt_maximum_plus_dsrgemm_tn_n.cu} (100%) rename test/device/{simt_maximum_plus_dsrgemm_tn_t_sm50.cu => sm50_simt_maximum_plus_dsrgemm_tn_t.cu} (100%) rename test/device/{simt_maximum_plus_dsrgemm_tt_n_sm50.cu => sm50_simt_maximum_plus_dsrgemm_tt_n.cu} (100%) rename test/device/{simt_maximum_plus_dsrgemm_tt_t_sm50.cu => sm50_simt_maximum_plus_dsrgemm_tt_t.cu} (100%) rename test/device/{simt_maximum_plus_ssrgemm_nn_n_sm50.cu => sm50_simt_maximum_plus_ssrgemm_nn_n.cu} 
(100%) rename test/device/{simt_maximum_plus_ssrgemm_nn_t_sm50.cu => sm50_simt_maximum_plus_ssrgemm_nn_t.cu} (100%) rename test/device/{simt_maximum_plus_ssrgemm_nt_n_sm50.cu => sm50_simt_maximum_plus_ssrgemm_nt_n.cu} (100%) rename test/device/{simt_maximum_plus_ssrgemm_nt_t_sm50.cu => sm50_simt_maximum_plus_ssrgemm_nt_t.cu} (100%) rename test/device/{simt_maximum_plus_ssrgemm_tn_n_sm50.cu => sm50_simt_maximum_plus_ssrgemm_tn_n.cu} (100%) rename test/device/{simt_maximum_plus_ssrgemm_tn_t_sm50.cu => sm50_simt_maximum_plus_ssrgemm_tn_t.cu} (100%) rename test/device/{simt_maximum_plus_ssrgemm_tt_n_sm50.cu => sm50_simt_maximum_plus_ssrgemm_tt_n.cu} (100%) rename test/device/{simt_maximum_plus_ssrgemm_tt_t_sm50.cu => sm50_simt_maximum_plus_ssrgemm_tt_t.cu} (100%) rename test/device/{simt_minimum_maximum_dsrgemm_nn_n_sm50.cu => sm50_simt_minimum_maximum_dsrgemm_nn_n.cu} (100%) rename test/device/{simt_minimum_maximum_dsrgemm_nn_t_sm50.cu => sm50_simt_minimum_maximum_dsrgemm_nn_t.cu} (100%) rename test/device/{simt_minimum_maximum_dsrgemm_nt_n_sm50.cu => sm50_simt_minimum_maximum_dsrgemm_nt_n.cu} (100%) rename test/device/{simt_minimum_maximum_dsrgemm_nt_t_sm50.cu => sm50_simt_minimum_maximum_dsrgemm_nt_t.cu} (100%) rename test/device/{simt_minimum_maximum_dsrgemm_tn_n_sm50.cu => sm50_simt_minimum_maximum_dsrgemm_tn_n.cu} (100%) rename test/device/{simt_minimum_maximum_dsrgemm_tn_t_sm50.cu => sm50_simt_minimum_maximum_dsrgemm_tn_t.cu} (100%) rename test/device/{simt_minimum_maximum_dsrgemm_tt_n_sm50.cu => sm50_simt_minimum_maximum_dsrgemm_tt_n.cu} (100%) rename test/device/{simt_minimum_maximum_dsrgemm_tt_t_sm50.cu => sm50_simt_minimum_maximum_dsrgemm_tt_t.cu} (100%) rename test/device/{simt_minimum_maximum_ssrgemm_nn_n_sm50.cu => sm50_simt_minimum_maximum_ssrgemm_nn_n.cu} (100%) rename test/device/{simt_minimum_maximum_ssrgemm_nn_t_sm50.cu => sm50_simt_minimum_maximum_ssrgemm_nn_t.cu} (100%) rename test/device/{simt_minimum_maximum_ssrgemm_nt_n_sm50.cu => 
sm50_simt_minimum_maximum_ssrgemm_nt_n.cu} (100%) rename test/device/{simt_minimum_maximum_ssrgemm_nt_t_sm50.cu => sm50_simt_minimum_maximum_ssrgemm_nt_t.cu} (100%) rename test/device/{simt_minimum_maximum_ssrgemm_tn_n_sm50.cu => sm50_simt_minimum_maximum_ssrgemm_tn_n.cu} (100%) rename test/device/{simt_minimum_maximum_ssrgemm_tn_t_sm50.cu => sm50_simt_minimum_maximum_ssrgemm_tn_t.cu} (100%) rename test/device/{simt_minimum_maximum_ssrgemm_tt_n_sm50.cu => sm50_simt_minimum_maximum_ssrgemm_tt_n.cu} (100%) rename test/device/{simt_minimum_maximum_ssrgemm_tt_t_sm50.cu => sm50_simt_minimum_maximum_ssrgemm_tt_t.cu} (100%) rename test/device/{simt_minimum_multiplies_dsrgemm_nn_n_sm50.cu => sm50_simt_minimum_multiplies_dsrgemm_nn_n.cu} (100%) rename test/device/{simt_minimum_multiplies_dsrgemm_nn_t_sm50.cu => sm50_simt_minimum_multiplies_dsrgemm_nn_t.cu} (100%) rename test/device/{simt_minimum_multiplies_dsrgemm_nt_n_sm50.cu => sm50_simt_minimum_multiplies_dsrgemm_nt_n.cu} (100%) rename test/device/{simt_minimum_multiplies_dsrgemm_nt_t_sm50.cu => sm50_simt_minimum_multiplies_dsrgemm_nt_t.cu} (100%) rename test/device/{simt_minimum_multiplies_dsrgemm_tn_n_sm50.cu => sm50_simt_minimum_multiplies_dsrgemm_tn_n.cu} (100%) rename test/device/{simt_minimum_multiplies_dsrgemm_tn_t_sm50.cu => sm50_simt_minimum_multiplies_dsrgemm_tn_t.cu} (100%) rename test/device/{simt_minimum_multiplies_dsrgemm_tt_n_sm50.cu => sm50_simt_minimum_multiplies_dsrgemm_tt_n.cu} (100%) rename test/device/{simt_minimum_multiplies_dsrgemm_tt_t_sm50.cu => sm50_simt_minimum_multiplies_dsrgemm_tt_t.cu} (100%) rename test/device/{simt_minimum_multiplies_ssrgemm_nn_n_sm50.cu => sm50_simt_minimum_multiplies_ssrgemm_nn_n.cu} (100%) rename test/device/{simt_minimum_multiplies_ssrgemm_nn_t_sm50.cu => sm50_simt_minimum_multiplies_ssrgemm_nn_t.cu} (100%) rename test/device/{simt_minimum_multiplies_ssrgemm_nt_n_sm50.cu => sm50_simt_minimum_multiplies_ssrgemm_nt_n.cu} (100%) rename 
test/device/{simt_minimum_multiplies_ssrgemm_nt_t_sm50.cu => sm50_simt_minimum_multiplies_ssrgemm_nt_t.cu} (100%) rename test/device/{simt_minimum_multiplies_ssrgemm_tn_n_sm50.cu => sm50_simt_minimum_multiplies_ssrgemm_tn_n.cu} (100%) rename test/device/{simt_minimum_multiplies_ssrgemm_tn_t_sm50.cu => sm50_simt_minimum_multiplies_ssrgemm_tn_t.cu} (100%) rename test/device/{simt_minimum_multiplies_ssrgemm_tt_n_sm50.cu => sm50_simt_minimum_multiplies_ssrgemm_tt_n.cu} (100%) rename test/device/{simt_minimum_multiplies_ssrgemm_tt_t_sm50.cu => sm50_simt_minimum_multiplies_ssrgemm_tt_t.cu} (100%) rename test/device/{simt_minimum_plus_dsrgemm_nn_n_sm50.cu => sm50_simt_minimum_plus_dsrgemm_nn_n.cu} (100%) rename test/device/{simt_minimum_plus_dsrgemm_nn_t_sm50.cu => sm50_simt_minimum_plus_dsrgemm_nn_t.cu} (100%) rename test/device/{simt_minimum_plus_dsrgemm_nt_n_sm50.cu => sm50_simt_minimum_plus_dsrgemm_nt_n.cu} (100%) rename test/device/{simt_minimum_plus_dsrgemm_nt_t_sm50.cu => sm50_simt_minimum_plus_dsrgemm_nt_t.cu} (100%) rename test/device/{simt_minimum_plus_dsrgemm_tn_n_sm50.cu => sm50_simt_minimum_plus_dsrgemm_tn_n.cu} (100%) rename test/device/{simt_minimum_plus_dsrgemm_tn_t_sm50.cu => sm50_simt_minimum_plus_dsrgemm_tn_t.cu} (100%) rename test/device/{simt_minimum_plus_dsrgemm_tt_n_sm50.cu => sm50_simt_minimum_plus_dsrgemm_tt_n.cu} (100%) rename test/device/{simt_minimum_plus_dsrgemm_tt_t_sm50.cu => sm50_simt_minimum_plus_dsrgemm_tt_t.cu} (100%) rename test/device/{simt_minimum_plus_ssrgemm_nn_n_sm50.cu => sm50_simt_minimum_plus_ssrgemm_nn_n.cu} (100%) rename test/device/{simt_minimum_plus_ssrgemm_nn_t_sm50.cu => sm50_simt_minimum_plus_ssrgemm_nn_t.cu} (100%) rename test/device/{simt_minimum_plus_ssrgemm_nt_n_sm50.cu => sm50_simt_minimum_plus_ssrgemm_nt_n.cu} (100%) rename test/device/{simt_minimum_plus_ssrgemm_nt_t_sm50.cu => sm50_simt_minimum_plus_ssrgemm_nt_t.cu} (100%) rename test/device/{simt_minimum_plus_ssrgemm_tn_n_sm50.cu => 
sm50_simt_minimum_plus_ssrgemm_tn_n.cu} (100%) rename test/device/{simt_minimum_plus_ssrgemm_tn_t_sm50.cu => sm50_simt_minimum_plus_ssrgemm_tn_t.cu} (100%) rename test/device/{simt_minimum_plus_ssrgemm_tt_n_sm50.cu => sm50_simt_minimum_plus_ssrgemm_tt_n.cu} (100%) rename test/device/{simt_minimum_plus_ssrgemm_tt_t_sm50.cu => sm50_simt_minimum_plus_ssrgemm_tt_t.cu} (100%) rename test/device/{simt_plus_multiplies_dsrgemm_nn_n_sm50.cu => sm50_simt_plus_multiplies_dsrgemm_nn_n.cu} (100%) rename test/device/{simt_plus_multiplies_dsrgemm_nn_t_sm50.cu => sm50_simt_plus_multiplies_dsrgemm_nn_t.cu} (100%) rename test/device/{simt_plus_multiplies_dsrgemm_nt_n_sm50.cu => sm50_simt_plus_multiplies_dsrgemm_nt_n.cu} (100%) rename test/device/{simt_plus_multiplies_dsrgemm_nt_t_sm50.cu => sm50_simt_plus_multiplies_dsrgemm_nt_t.cu} (100%) rename test/device/{simt_plus_multiplies_dsrgemm_tn_n_sm50.cu => sm50_simt_plus_multiplies_dsrgemm_tn_n.cu} (100%) rename test/device/{simt_plus_multiplies_dsrgemm_tn_t_sm50.cu => sm50_simt_plus_multiplies_dsrgemm_tn_t.cu} (100%) rename test/device/{simt_plus_multiplies_dsrgemm_tt_n_sm50.cu => sm50_simt_plus_multiplies_dsrgemm_tt_n.cu} (100%) rename test/device/{simt_plus_multiplies_dsrgemm_tt_t_sm50.cu => sm50_simt_plus_multiplies_dsrgemm_tt_t.cu} (100%) rename test/device/{simt_plus_multiplies_ssrgemm_nn_n_sm50.cu => sm50_simt_plus_multiplies_ssrgemm_nn_n.cu} (100%) rename test/device/{simt_plus_multiplies_ssrgemm_nn_t_sm50.cu => sm50_simt_plus_multiplies_ssrgemm_nn_t.cu} (100%) rename test/device/{simt_plus_multiplies_ssrgemm_nt_n_sm50.cu => sm50_simt_plus_multiplies_ssrgemm_nt_n.cu} (100%) rename test/device/{simt_plus_multiplies_ssrgemm_nt_t_sm50.cu => sm50_simt_plus_multiplies_ssrgemm_nt_t.cu} (100%) rename test/device/{simt_plus_multiplies_ssrgemm_tn_n_sm50.cu => sm50_simt_plus_multiplies_ssrgemm_tn_n.cu} (100%) rename test/device/{simt_plus_multiplies_ssrgemm_tn_t_sm50.cu => sm50_simt_plus_multiplies_ssrgemm_tn_t.cu} (100%) rename 
test/device/{simt_plus_multiplies_ssrgemm_tt_n_sm50.cu => sm50_simt_plus_multiplies_ssrgemm_tt_n.cu} (100%) rename test/device/{simt_plus_multiplies_ssrgemm_tt_t_sm50.cu => sm50_simt_plus_multiplies_ssrgemm_tt_t.cu} (100%) diff --git a/test/device/simt_sm50.py b/test/device/gen_simt.py similarity index 93% rename from test/device/simt_sm50.py rename to test/device/gen_simt.py index 1339891..52678f0 100644 --- a/test/device/simt_sm50.py +++ b/test/device/gen_simt.py @@ -1,4 +1,6 @@ import os +import sys +import argparse # this file creates the test/unit/gemm/device simt tests and the CMake file to go with it ################################################################################ @@ -92,10 +94,10 @@ test_template = """\ #if defined(CUASR_TEST_LEVEL) and (CUASR_TEST_LEVEL >= {21}) -TEST(SM50_device_{0}_{1}_{2}srgemm_{4}{5}_{6}, {10}x{11}x{12}_{13}x{14}x1_{15}x{16}_{17}x{18}_{19}x{20}) {{ +TEST(SM{22}_device_{0}_{1}_{2}srgemm_{4}{5}_{6}, {10}x{11}x{12}_{13}x{14}x1_{15}x{16}_{17}x{18}_{19}x{20}) {{ using precision = {3}; using OpClass = cutlass::arch::OpClassSimt; - using SmArch = cutlass::arch::Sm50; + using SmArch = cutlass::arch::Sm{22}; using ThreadblockShape = cutlass::gemm::GemmShape<{10}, {11}, {12}>; using WarpShape = cutlass::gemm::GemmShape<{13}, {14}, {12}>; @@ -146,7 +148,8 @@ def write_test_to_file( warp_threadsM, warp_threadsN, warps_per_tb, - test_level): + test_level, + sm_arch): print("{:.0f}x{:.0f}x{:.0f}__{:.0f}x{:.0f}_{:.0f}x{:.0f}_{:.0f}x{:.0f}".format( threadblock_tile[0], threadblock_tile[1], unroll, thread_tileM, thread_tileN, @@ -186,11 +189,12 @@ def write_test_to_file( int(warp_threadsN), # 18 int(warps_per_tb[0]), # 19 int(warps_per_tb[1]), # 20 - int(test_level) # 21 + int(test_level), # 21 + int(sm_arch) # 22 )) -def main(output_dir: str): +def main(args): # warps per threadblock warps_per_threadblocks = [] for warps_per_tb0 in WARPS_PER_TB_EDGE: @@ -242,12 +246,12 @@ def main(output_dir: str): transC = "n" if column_major_C else 
"t" # open file - testfile_name = "simt_{}_{}_{}srgemm_{}{}_{}_sm50.cu".format( - add_op, mult_op, precision_char, + testfile_name = "sm{}_simt_{}_{}_{}srgemm_{}{}_{}.cu".format( + args.sm_arch, add_op, mult_op, precision_char, transA, transB, transC) print("\n", testfile_name) - filePath = os.path.join(output_dir, testfile_name) + filePath = os.path.join(args.output_dir, testfile_name) with open(filePath, "w") as testfile: write_test_file_header(testfile) @@ -362,10 +366,17 @@ def main(output_dir: str): warp_threadsM, warp_threadsN, warps_per_tb, - test_level) + test_level, + args.sm_arch) num_tests += 1 print("Total test count per semi-ring = {}".format(num_tests//len(semiring_operators))) if __name__ == "__main__": - main(".") + parser = argparse.ArgumentParser() + parser.add_argument("-o", "--output-dir", type=str, required=False, default=".", + help="Path to the output dir.") + parser.add_argument("-sm", "--sm-arch", type=int, required=False, default=50, choices=[50, 80], + help="SM architecture version number,") + args = parser.parse_args(sys.argv[1:]) + main(args) diff --git a/test/device/simt_binary_or_binary_and_dsrgemm_nn_n_sm50.cu b/test/device/sm50_simt_binary_or_binary_and_dsrgemm_nn_n.cu similarity index 100% rename from test/device/simt_binary_or_binary_and_dsrgemm_nn_n_sm50.cu rename to test/device/sm50_simt_binary_or_binary_and_dsrgemm_nn_n.cu diff --git a/test/device/simt_binary_or_binary_and_dsrgemm_nn_t_sm50.cu b/test/device/sm50_simt_binary_or_binary_and_dsrgemm_nn_t.cu similarity index 100% rename from test/device/simt_binary_or_binary_and_dsrgemm_nn_t_sm50.cu rename to test/device/sm50_simt_binary_or_binary_and_dsrgemm_nn_t.cu diff --git a/test/device/simt_binary_or_binary_and_dsrgemm_nt_n_sm50.cu b/test/device/sm50_simt_binary_or_binary_and_dsrgemm_nt_n.cu similarity index 100% rename from test/device/simt_binary_or_binary_and_dsrgemm_nt_n_sm50.cu rename to test/device/sm50_simt_binary_or_binary_and_dsrgemm_nt_n.cu diff --git 
a/test/device/simt_binary_or_binary_and_dsrgemm_nt_t_sm50.cu b/test/device/sm50_simt_binary_or_binary_and_dsrgemm_nt_t.cu similarity index 100% rename from test/device/simt_binary_or_binary_and_dsrgemm_nt_t_sm50.cu rename to test/device/sm50_simt_binary_or_binary_and_dsrgemm_nt_t.cu diff --git a/test/device/simt_binary_or_binary_and_dsrgemm_tn_n_sm50.cu b/test/device/sm50_simt_binary_or_binary_and_dsrgemm_tn_n.cu similarity index 100% rename from test/device/simt_binary_or_binary_and_dsrgemm_tn_n_sm50.cu rename to test/device/sm50_simt_binary_or_binary_and_dsrgemm_tn_n.cu diff --git a/test/device/simt_binary_or_binary_and_dsrgemm_tn_t_sm50.cu b/test/device/sm50_simt_binary_or_binary_and_dsrgemm_tn_t.cu similarity index 100% rename from test/device/simt_binary_or_binary_and_dsrgemm_tn_t_sm50.cu rename to test/device/sm50_simt_binary_or_binary_and_dsrgemm_tn_t.cu diff --git a/test/device/simt_binary_or_binary_and_dsrgemm_tt_n_sm50.cu b/test/device/sm50_simt_binary_or_binary_and_dsrgemm_tt_n.cu similarity index 100% rename from test/device/simt_binary_or_binary_and_dsrgemm_tt_n_sm50.cu rename to test/device/sm50_simt_binary_or_binary_and_dsrgemm_tt_n.cu diff --git a/test/device/simt_binary_or_binary_and_dsrgemm_tt_t_sm50.cu b/test/device/sm50_simt_binary_or_binary_and_dsrgemm_tt_t.cu similarity index 100% rename from test/device/simt_binary_or_binary_and_dsrgemm_tt_t_sm50.cu rename to test/device/sm50_simt_binary_or_binary_and_dsrgemm_tt_t.cu diff --git a/test/device/simt_binary_or_binary_and_ssrgemm_nn_n_sm50.cu b/test/device/sm50_simt_binary_or_binary_and_ssrgemm_nn_n.cu similarity index 100% rename from test/device/simt_binary_or_binary_and_ssrgemm_nn_n_sm50.cu rename to test/device/sm50_simt_binary_or_binary_and_ssrgemm_nn_n.cu diff --git a/test/device/simt_binary_or_binary_and_ssrgemm_nn_t_sm50.cu b/test/device/sm50_simt_binary_or_binary_and_ssrgemm_nn_t.cu similarity index 100% rename from test/device/simt_binary_or_binary_and_ssrgemm_nn_t_sm50.cu rename to 
test/device/sm50_simt_binary_or_binary_and_ssrgemm_nn_t.cu diff --git a/test/device/simt_binary_or_binary_and_ssrgemm_nt_n_sm50.cu b/test/device/sm50_simt_binary_or_binary_and_ssrgemm_nt_n.cu similarity index 100% rename from test/device/simt_binary_or_binary_and_ssrgemm_nt_n_sm50.cu rename to test/device/sm50_simt_binary_or_binary_and_ssrgemm_nt_n.cu diff --git a/test/device/simt_binary_or_binary_and_ssrgemm_nt_t_sm50.cu b/test/device/sm50_simt_binary_or_binary_and_ssrgemm_nt_t.cu similarity index 100% rename from test/device/simt_binary_or_binary_and_ssrgemm_nt_t_sm50.cu rename to test/device/sm50_simt_binary_or_binary_and_ssrgemm_nt_t.cu diff --git a/test/device/simt_binary_or_binary_and_ssrgemm_tn_n_sm50.cu b/test/device/sm50_simt_binary_or_binary_and_ssrgemm_tn_n.cu similarity index 100% rename from test/device/simt_binary_or_binary_and_ssrgemm_tn_n_sm50.cu rename to test/device/sm50_simt_binary_or_binary_and_ssrgemm_tn_n.cu diff --git a/test/device/simt_binary_or_binary_and_ssrgemm_tn_t_sm50.cu b/test/device/sm50_simt_binary_or_binary_and_ssrgemm_tn_t.cu similarity index 100% rename from test/device/simt_binary_or_binary_and_ssrgemm_tn_t_sm50.cu rename to test/device/sm50_simt_binary_or_binary_and_ssrgemm_tn_t.cu diff --git a/test/device/simt_binary_or_binary_and_ssrgemm_tt_n_sm50.cu b/test/device/sm50_simt_binary_or_binary_and_ssrgemm_tt_n.cu similarity index 100% rename from test/device/simt_binary_or_binary_and_ssrgemm_tt_n_sm50.cu rename to test/device/sm50_simt_binary_or_binary_and_ssrgemm_tt_n.cu diff --git a/test/device/simt_binary_or_binary_and_ssrgemm_tt_t_sm50.cu b/test/device/sm50_simt_binary_or_binary_and_ssrgemm_tt_t.cu similarity index 100% rename from test/device/simt_binary_or_binary_and_ssrgemm_tt_t_sm50.cu rename to test/device/sm50_simt_binary_or_binary_and_ssrgemm_tt_t.cu diff --git a/test/device/simt_maximum_minimum_dsrgemm_nn_n_sm50.cu b/test/device/sm50_simt_maximum_minimum_dsrgemm_nn_n.cu similarity index 100% rename from 
test/device/simt_maximum_minimum_dsrgemm_nn_n_sm50.cu rename to test/device/sm50_simt_maximum_minimum_dsrgemm_nn_n.cu diff --git a/test/device/simt_maximum_minimum_dsrgemm_nn_t_sm50.cu b/test/device/sm50_simt_maximum_minimum_dsrgemm_nn_t.cu similarity index 100% rename from test/device/simt_maximum_minimum_dsrgemm_nn_t_sm50.cu rename to test/device/sm50_simt_maximum_minimum_dsrgemm_nn_t.cu diff --git a/test/device/simt_maximum_minimum_dsrgemm_nt_n_sm50.cu b/test/device/sm50_simt_maximum_minimum_dsrgemm_nt_n.cu similarity index 100% rename from test/device/simt_maximum_minimum_dsrgemm_nt_n_sm50.cu rename to test/device/sm50_simt_maximum_minimum_dsrgemm_nt_n.cu diff --git a/test/device/simt_maximum_minimum_dsrgemm_nt_t_sm50.cu b/test/device/sm50_simt_maximum_minimum_dsrgemm_nt_t.cu similarity index 100% rename from test/device/simt_maximum_minimum_dsrgemm_nt_t_sm50.cu rename to test/device/sm50_simt_maximum_minimum_dsrgemm_nt_t.cu diff --git a/test/device/simt_maximum_minimum_dsrgemm_tn_n_sm50.cu b/test/device/sm50_simt_maximum_minimum_dsrgemm_tn_n.cu similarity index 100% rename from test/device/simt_maximum_minimum_dsrgemm_tn_n_sm50.cu rename to test/device/sm50_simt_maximum_minimum_dsrgemm_tn_n.cu diff --git a/test/device/simt_maximum_minimum_dsrgemm_tn_t_sm50.cu b/test/device/sm50_simt_maximum_minimum_dsrgemm_tn_t.cu similarity index 100% rename from test/device/simt_maximum_minimum_dsrgemm_tn_t_sm50.cu rename to test/device/sm50_simt_maximum_minimum_dsrgemm_tn_t.cu diff --git a/test/device/simt_maximum_minimum_dsrgemm_tt_n_sm50.cu b/test/device/sm50_simt_maximum_minimum_dsrgemm_tt_n.cu similarity index 100% rename from test/device/simt_maximum_minimum_dsrgemm_tt_n_sm50.cu rename to test/device/sm50_simt_maximum_minimum_dsrgemm_tt_n.cu diff --git a/test/device/simt_maximum_minimum_dsrgemm_tt_t_sm50.cu b/test/device/sm50_simt_maximum_minimum_dsrgemm_tt_t.cu similarity index 100% rename from test/device/simt_maximum_minimum_dsrgemm_tt_t_sm50.cu rename to 
test/device/sm50_simt_maximum_minimum_dsrgemm_tt_t.cu diff --git a/test/device/simt_maximum_minimum_ssrgemm_nn_n_sm50.cu b/test/device/sm50_simt_maximum_minimum_ssrgemm_nn_n.cu similarity index 100% rename from test/device/simt_maximum_minimum_ssrgemm_nn_n_sm50.cu rename to test/device/sm50_simt_maximum_minimum_ssrgemm_nn_n.cu diff --git a/test/device/simt_maximum_minimum_ssrgemm_nn_t_sm50.cu b/test/device/sm50_simt_maximum_minimum_ssrgemm_nn_t.cu similarity index 100% rename from test/device/simt_maximum_minimum_ssrgemm_nn_t_sm50.cu rename to test/device/sm50_simt_maximum_minimum_ssrgemm_nn_t.cu diff --git a/test/device/simt_maximum_minimum_ssrgemm_nt_n_sm50.cu b/test/device/sm50_simt_maximum_minimum_ssrgemm_nt_n.cu similarity index 100% rename from test/device/simt_maximum_minimum_ssrgemm_nt_n_sm50.cu rename to test/device/sm50_simt_maximum_minimum_ssrgemm_nt_n.cu diff --git a/test/device/simt_maximum_minimum_ssrgemm_nt_t_sm50.cu b/test/device/sm50_simt_maximum_minimum_ssrgemm_nt_t.cu similarity index 100% rename from test/device/simt_maximum_minimum_ssrgemm_nt_t_sm50.cu rename to test/device/sm50_simt_maximum_minimum_ssrgemm_nt_t.cu diff --git a/test/device/simt_maximum_minimum_ssrgemm_tn_n_sm50.cu b/test/device/sm50_simt_maximum_minimum_ssrgemm_tn_n.cu similarity index 100% rename from test/device/simt_maximum_minimum_ssrgemm_tn_n_sm50.cu rename to test/device/sm50_simt_maximum_minimum_ssrgemm_tn_n.cu diff --git a/test/device/simt_maximum_minimum_ssrgemm_tn_t_sm50.cu b/test/device/sm50_simt_maximum_minimum_ssrgemm_tn_t.cu similarity index 100% rename from test/device/simt_maximum_minimum_ssrgemm_tn_t_sm50.cu rename to test/device/sm50_simt_maximum_minimum_ssrgemm_tn_t.cu diff --git a/test/device/simt_maximum_minimum_ssrgemm_tt_n_sm50.cu b/test/device/sm50_simt_maximum_minimum_ssrgemm_tt_n.cu similarity index 100% rename from test/device/simt_maximum_minimum_ssrgemm_tt_n_sm50.cu rename to test/device/sm50_simt_maximum_minimum_ssrgemm_tt_n.cu diff --git 
a/test/device/simt_maximum_minimum_ssrgemm_tt_t_sm50.cu b/test/device/sm50_simt_maximum_minimum_ssrgemm_tt_t.cu similarity index 100% rename from test/device/simt_maximum_minimum_ssrgemm_tt_t_sm50.cu rename to test/device/sm50_simt_maximum_minimum_ssrgemm_tt_t.cu diff --git a/test/device/simt_maximum_multiplies_dsrgemm_nn_n_sm50.cu b/test/device/sm50_simt_maximum_multiplies_dsrgemm_nn_n.cu similarity index 100% rename from test/device/simt_maximum_multiplies_dsrgemm_nn_n_sm50.cu rename to test/device/sm50_simt_maximum_multiplies_dsrgemm_nn_n.cu diff --git a/test/device/simt_maximum_multiplies_dsrgemm_nn_t_sm50.cu b/test/device/sm50_simt_maximum_multiplies_dsrgemm_nn_t.cu similarity index 100% rename from test/device/simt_maximum_multiplies_dsrgemm_nn_t_sm50.cu rename to test/device/sm50_simt_maximum_multiplies_dsrgemm_nn_t.cu diff --git a/test/device/simt_maximum_multiplies_dsrgemm_nt_n_sm50.cu b/test/device/sm50_simt_maximum_multiplies_dsrgemm_nt_n.cu similarity index 100% rename from test/device/simt_maximum_multiplies_dsrgemm_nt_n_sm50.cu rename to test/device/sm50_simt_maximum_multiplies_dsrgemm_nt_n.cu diff --git a/test/device/simt_maximum_multiplies_dsrgemm_nt_t_sm50.cu b/test/device/sm50_simt_maximum_multiplies_dsrgemm_nt_t.cu similarity index 100% rename from test/device/simt_maximum_multiplies_dsrgemm_nt_t_sm50.cu rename to test/device/sm50_simt_maximum_multiplies_dsrgemm_nt_t.cu diff --git a/test/device/simt_maximum_multiplies_dsrgemm_tn_n_sm50.cu b/test/device/sm50_simt_maximum_multiplies_dsrgemm_tn_n.cu similarity index 100% rename from test/device/simt_maximum_multiplies_dsrgemm_tn_n_sm50.cu rename to test/device/sm50_simt_maximum_multiplies_dsrgemm_tn_n.cu diff --git a/test/device/simt_maximum_multiplies_dsrgemm_tn_t_sm50.cu b/test/device/sm50_simt_maximum_multiplies_dsrgemm_tn_t.cu similarity index 100% rename from test/device/simt_maximum_multiplies_dsrgemm_tn_t_sm50.cu rename to test/device/sm50_simt_maximum_multiplies_dsrgemm_tn_t.cu diff --git 
a/test/device/simt_maximum_multiplies_dsrgemm_tt_n_sm50.cu b/test/device/sm50_simt_maximum_multiplies_dsrgemm_tt_n.cu similarity index 100% rename from test/device/simt_maximum_multiplies_dsrgemm_tt_n_sm50.cu rename to test/device/sm50_simt_maximum_multiplies_dsrgemm_tt_n.cu diff --git a/test/device/simt_maximum_multiplies_dsrgemm_tt_t_sm50.cu b/test/device/sm50_simt_maximum_multiplies_dsrgemm_tt_t.cu similarity index 100% rename from test/device/simt_maximum_multiplies_dsrgemm_tt_t_sm50.cu rename to test/device/sm50_simt_maximum_multiplies_dsrgemm_tt_t.cu diff --git a/test/device/simt_maximum_multiplies_ssrgemm_nn_n_sm50.cu b/test/device/sm50_simt_maximum_multiplies_ssrgemm_nn_n.cu similarity index 100% rename from test/device/simt_maximum_multiplies_ssrgemm_nn_n_sm50.cu rename to test/device/sm50_simt_maximum_multiplies_ssrgemm_nn_n.cu diff --git a/test/device/simt_maximum_multiplies_ssrgemm_nn_t_sm50.cu b/test/device/sm50_simt_maximum_multiplies_ssrgemm_nn_t.cu similarity index 100% rename from test/device/simt_maximum_multiplies_ssrgemm_nn_t_sm50.cu rename to test/device/sm50_simt_maximum_multiplies_ssrgemm_nn_t.cu diff --git a/test/device/simt_maximum_multiplies_ssrgemm_nt_n_sm50.cu b/test/device/sm50_simt_maximum_multiplies_ssrgemm_nt_n.cu similarity index 100% rename from test/device/simt_maximum_multiplies_ssrgemm_nt_n_sm50.cu rename to test/device/sm50_simt_maximum_multiplies_ssrgemm_nt_n.cu diff --git a/test/device/simt_maximum_multiplies_ssrgemm_nt_t_sm50.cu b/test/device/sm50_simt_maximum_multiplies_ssrgemm_nt_t.cu similarity index 100% rename from test/device/simt_maximum_multiplies_ssrgemm_nt_t_sm50.cu rename to test/device/sm50_simt_maximum_multiplies_ssrgemm_nt_t.cu diff --git a/test/device/simt_maximum_multiplies_ssrgemm_tn_n_sm50.cu b/test/device/sm50_simt_maximum_multiplies_ssrgemm_tn_n.cu similarity index 100% rename from test/device/simt_maximum_multiplies_ssrgemm_tn_n_sm50.cu rename to test/device/sm50_simt_maximum_multiplies_ssrgemm_tn_n.cu 
diff --git a/test/device/simt_maximum_multiplies_ssrgemm_tn_t_sm50.cu b/test/device/sm50_simt_maximum_multiplies_ssrgemm_tn_t.cu similarity index 100% rename from test/device/simt_maximum_multiplies_ssrgemm_tn_t_sm50.cu rename to test/device/sm50_simt_maximum_multiplies_ssrgemm_tn_t.cu diff --git a/test/device/simt_maximum_multiplies_ssrgemm_tt_n_sm50.cu b/test/device/sm50_simt_maximum_multiplies_ssrgemm_tt_n.cu similarity index 100% rename from test/device/simt_maximum_multiplies_ssrgemm_tt_n_sm50.cu rename to test/device/sm50_simt_maximum_multiplies_ssrgemm_tt_n.cu diff --git a/test/device/simt_maximum_multiplies_ssrgemm_tt_t_sm50.cu b/test/device/sm50_simt_maximum_multiplies_ssrgemm_tt_t.cu similarity index 100% rename from test/device/simt_maximum_multiplies_ssrgemm_tt_t_sm50.cu rename to test/device/sm50_simt_maximum_multiplies_ssrgemm_tt_t.cu diff --git a/test/device/simt_maximum_plus_dsrgemm_nn_n_sm50.cu b/test/device/sm50_simt_maximum_plus_dsrgemm_nn_n.cu similarity index 100% rename from test/device/simt_maximum_plus_dsrgemm_nn_n_sm50.cu rename to test/device/sm50_simt_maximum_plus_dsrgemm_nn_n.cu diff --git a/test/device/simt_maximum_plus_dsrgemm_nn_t_sm50.cu b/test/device/sm50_simt_maximum_plus_dsrgemm_nn_t.cu similarity index 100% rename from test/device/simt_maximum_plus_dsrgemm_nn_t_sm50.cu rename to test/device/sm50_simt_maximum_plus_dsrgemm_nn_t.cu diff --git a/test/device/simt_maximum_plus_dsrgemm_nt_n_sm50.cu b/test/device/sm50_simt_maximum_plus_dsrgemm_nt_n.cu similarity index 100% rename from test/device/simt_maximum_plus_dsrgemm_nt_n_sm50.cu rename to test/device/sm50_simt_maximum_plus_dsrgemm_nt_n.cu diff --git a/test/device/simt_maximum_plus_dsrgemm_nt_t_sm50.cu b/test/device/sm50_simt_maximum_plus_dsrgemm_nt_t.cu similarity index 100% rename from test/device/simt_maximum_plus_dsrgemm_nt_t_sm50.cu rename to test/device/sm50_simt_maximum_plus_dsrgemm_nt_t.cu diff --git a/test/device/simt_maximum_plus_dsrgemm_tn_n_sm50.cu 
b/test/device/sm50_simt_maximum_plus_dsrgemm_tn_n.cu similarity index 100% rename from test/device/simt_maximum_plus_dsrgemm_tn_n_sm50.cu rename to test/device/sm50_simt_maximum_plus_dsrgemm_tn_n.cu diff --git a/test/device/simt_maximum_plus_dsrgemm_tn_t_sm50.cu b/test/device/sm50_simt_maximum_plus_dsrgemm_tn_t.cu similarity index 100% rename from test/device/simt_maximum_plus_dsrgemm_tn_t_sm50.cu rename to test/device/sm50_simt_maximum_plus_dsrgemm_tn_t.cu diff --git a/test/device/simt_maximum_plus_dsrgemm_tt_n_sm50.cu b/test/device/sm50_simt_maximum_plus_dsrgemm_tt_n.cu similarity index 100% rename from test/device/simt_maximum_plus_dsrgemm_tt_n_sm50.cu rename to test/device/sm50_simt_maximum_plus_dsrgemm_tt_n.cu diff --git a/test/device/simt_maximum_plus_dsrgemm_tt_t_sm50.cu b/test/device/sm50_simt_maximum_plus_dsrgemm_tt_t.cu similarity index 100% rename from test/device/simt_maximum_plus_dsrgemm_tt_t_sm50.cu rename to test/device/sm50_simt_maximum_plus_dsrgemm_tt_t.cu diff --git a/test/device/simt_maximum_plus_ssrgemm_nn_n_sm50.cu b/test/device/sm50_simt_maximum_plus_ssrgemm_nn_n.cu similarity index 100% rename from test/device/simt_maximum_plus_ssrgemm_nn_n_sm50.cu rename to test/device/sm50_simt_maximum_plus_ssrgemm_nn_n.cu diff --git a/test/device/simt_maximum_plus_ssrgemm_nn_t_sm50.cu b/test/device/sm50_simt_maximum_plus_ssrgemm_nn_t.cu similarity index 100% rename from test/device/simt_maximum_plus_ssrgemm_nn_t_sm50.cu rename to test/device/sm50_simt_maximum_plus_ssrgemm_nn_t.cu diff --git a/test/device/simt_maximum_plus_ssrgemm_nt_n_sm50.cu b/test/device/sm50_simt_maximum_plus_ssrgemm_nt_n.cu similarity index 100% rename from test/device/simt_maximum_plus_ssrgemm_nt_n_sm50.cu rename to test/device/sm50_simt_maximum_plus_ssrgemm_nt_n.cu diff --git a/test/device/simt_maximum_plus_ssrgemm_nt_t_sm50.cu b/test/device/sm50_simt_maximum_plus_ssrgemm_nt_t.cu similarity index 100% rename from test/device/simt_maximum_plus_ssrgemm_nt_t_sm50.cu rename to 
test/device/sm50_simt_maximum_plus_ssrgemm_nt_t.cu diff --git a/test/device/simt_maximum_plus_ssrgemm_tn_n_sm50.cu b/test/device/sm50_simt_maximum_plus_ssrgemm_tn_n.cu similarity index 100% rename from test/device/simt_maximum_plus_ssrgemm_tn_n_sm50.cu rename to test/device/sm50_simt_maximum_plus_ssrgemm_tn_n.cu diff --git a/test/device/simt_maximum_plus_ssrgemm_tn_t_sm50.cu b/test/device/sm50_simt_maximum_plus_ssrgemm_tn_t.cu similarity index 100% rename from test/device/simt_maximum_plus_ssrgemm_tn_t_sm50.cu rename to test/device/sm50_simt_maximum_plus_ssrgemm_tn_t.cu diff --git a/test/device/simt_maximum_plus_ssrgemm_tt_n_sm50.cu b/test/device/sm50_simt_maximum_plus_ssrgemm_tt_n.cu similarity index 100% rename from test/device/simt_maximum_plus_ssrgemm_tt_n_sm50.cu rename to test/device/sm50_simt_maximum_plus_ssrgemm_tt_n.cu diff --git a/test/device/simt_maximum_plus_ssrgemm_tt_t_sm50.cu b/test/device/sm50_simt_maximum_plus_ssrgemm_tt_t.cu similarity index 100% rename from test/device/simt_maximum_plus_ssrgemm_tt_t_sm50.cu rename to test/device/sm50_simt_maximum_plus_ssrgemm_tt_t.cu diff --git a/test/device/simt_minimum_maximum_dsrgemm_nn_n_sm50.cu b/test/device/sm50_simt_minimum_maximum_dsrgemm_nn_n.cu similarity index 100% rename from test/device/simt_minimum_maximum_dsrgemm_nn_n_sm50.cu rename to test/device/sm50_simt_minimum_maximum_dsrgemm_nn_n.cu diff --git a/test/device/simt_minimum_maximum_dsrgemm_nn_t_sm50.cu b/test/device/sm50_simt_minimum_maximum_dsrgemm_nn_t.cu similarity index 100% rename from test/device/simt_minimum_maximum_dsrgemm_nn_t_sm50.cu rename to test/device/sm50_simt_minimum_maximum_dsrgemm_nn_t.cu diff --git a/test/device/simt_minimum_maximum_dsrgemm_nt_n_sm50.cu b/test/device/sm50_simt_minimum_maximum_dsrgemm_nt_n.cu similarity index 100% rename from test/device/simt_minimum_maximum_dsrgemm_nt_n_sm50.cu rename to test/device/sm50_simt_minimum_maximum_dsrgemm_nt_n.cu diff --git a/test/device/simt_minimum_maximum_dsrgemm_nt_t_sm50.cu 
b/test/device/sm50_simt_minimum_maximum_dsrgemm_nt_t.cu similarity index 100% rename from test/device/simt_minimum_maximum_dsrgemm_nt_t_sm50.cu rename to test/device/sm50_simt_minimum_maximum_dsrgemm_nt_t.cu diff --git a/test/device/simt_minimum_maximum_dsrgemm_tn_n_sm50.cu b/test/device/sm50_simt_minimum_maximum_dsrgemm_tn_n.cu similarity index 100% rename from test/device/simt_minimum_maximum_dsrgemm_tn_n_sm50.cu rename to test/device/sm50_simt_minimum_maximum_dsrgemm_tn_n.cu diff --git a/test/device/simt_minimum_maximum_dsrgemm_tn_t_sm50.cu b/test/device/sm50_simt_minimum_maximum_dsrgemm_tn_t.cu similarity index 100% rename from test/device/simt_minimum_maximum_dsrgemm_tn_t_sm50.cu rename to test/device/sm50_simt_minimum_maximum_dsrgemm_tn_t.cu diff --git a/test/device/simt_minimum_maximum_dsrgemm_tt_n_sm50.cu b/test/device/sm50_simt_minimum_maximum_dsrgemm_tt_n.cu similarity index 100% rename from test/device/simt_minimum_maximum_dsrgemm_tt_n_sm50.cu rename to test/device/sm50_simt_minimum_maximum_dsrgemm_tt_n.cu diff --git a/test/device/simt_minimum_maximum_dsrgemm_tt_t_sm50.cu b/test/device/sm50_simt_minimum_maximum_dsrgemm_tt_t.cu similarity index 100% rename from test/device/simt_minimum_maximum_dsrgemm_tt_t_sm50.cu rename to test/device/sm50_simt_minimum_maximum_dsrgemm_tt_t.cu diff --git a/test/device/simt_minimum_maximum_ssrgemm_nn_n_sm50.cu b/test/device/sm50_simt_minimum_maximum_ssrgemm_nn_n.cu similarity index 100% rename from test/device/simt_minimum_maximum_ssrgemm_nn_n_sm50.cu rename to test/device/sm50_simt_minimum_maximum_ssrgemm_nn_n.cu diff --git a/test/device/simt_minimum_maximum_ssrgemm_nn_t_sm50.cu b/test/device/sm50_simt_minimum_maximum_ssrgemm_nn_t.cu similarity index 100% rename from test/device/simt_minimum_maximum_ssrgemm_nn_t_sm50.cu rename to test/device/sm50_simt_minimum_maximum_ssrgemm_nn_t.cu diff --git a/test/device/simt_minimum_maximum_ssrgemm_nt_n_sm50.cu b/test/device/sm50_simt_minimum_maximum_ssrgemm_nt_n.cu similarity index 
100% rename from test/device/simt_minimum_maximum_ssrgemm_nt_n_sm50.cu rename to test/device/sm50_simt_minimum_maximum_ssrgemm_nt_n.cu diff --git a/test/device/simt_minimum_maximum_ssrgemm_nt_t_sm50.cu b/test/device/sm50_simt_minimum_maximum_ssrgemm_nt_t.cu similarity index 100% rename from test/device/simt_minimum_maximum_ssrgemm_nt_t_sm50.cu rename to test/device/sm50_simt_minimum_maximum_ssrgemm_nt_t.cu diff --git a/test/device/simt_minimum_maximum_ssrgemm_tn_n_sm50.cu b/test/device/sm50_simt_minimum_maximum_ssrgemm_tn_n.cu similarity index 100% rename from test/device/simt_minimum_maximum_ssrgemm_tn_n_sm50.cu rename to test/device/sm50_simt_minimum_maximum_ssrgemm_tn_n.cu diff --git a/test/device/simt_minimum_maximum_ssrgemm_tn_t_sm50.cu b/test/device/sm50_simt_minimum_maximum_ssrgemm_tn_t.cu similarity index 100% rename from test/device/simt_minimum_maximum_ssrgemm_tn_t_sm50.cu rename to test/device/sm50_simt_minimum_maximum_ssrgemm_tn_t.cu diff --git a/test/device/simt_minimum_maximum_ssrgemm_tt_n_sm50.cu b/test/device/sm50_simt_minimum_maximum_ssrgemm_tt_n.cu similarity index 100% rename from test/device/simt_minimum_maximum_ssrgemm_tt_n_sm50.cu rename to test/device/sm50_simt_minimum_maximum_ssrgemm_tt_n.cu diff --git a/test/device/simt_minimum_maximum_ssrgemm_tt_t_sm50.cu b/test/device/sm50_simt_minimum_maximum_ssrgemm_tt_t.cu similarity index 100% rename from test/device/simt_minimum_maximum_ssrgemm_tt_t_sm50.cu rename to test/device/sm50_simt_minimum_maximum_ssrgemm_tt_t.cu diff --git a/test/device/simt_minimum_multiplies_dsrgemm_nn_n_sm50.cu b/test/device/sm50_simt_minimum_multiplies_dsrgemm_nn_n.cu similarity index 100% rename from test/device/simt_minimum_multiplies_dsrgemm_nn_n_sm50.cu rename to test/device/sm50_simt_minimum_multiplies_dsrgemm_nn_n.cu diff --git a/test/device/simt_minimum_multiplies_dsrgemm_nn_t_sm50.cu b/test/device/sm50_simt_minimum_multiplies_dsrgemm_nn_t.cu similarity index 100% rename from 
test/device/simt_minimum_multiplies_dsrgemm_nn_t_sm50.cu rename to test/device/sm50_simt_minimum_multiplies_dsrgemm_nn_t.cu diff --git a/test/device/simt_minimum_multiplies_dsrgemm_nt_n_sm50.cu b/test/device/sm50_simt_minimum_multiplies_dsrgemm_nt_n.cu similarity index 100% rename from test/device/simt_minimum_multiplies_dsrgemm_nt_n_sm50.cu rename to test/device/sm50_simt_minimum_multiplies_dsrgemm_nt_n.cu diff --git a/test/device/simt_minimum_multiplies_dsrgemm_nt_t_sm50.cu b/test/device/sm50_simt_minimum_multiplies_dsrgemm_nt_t.cu similarity index 100% rename from test/device/simt_minimum_multiplies_dsrgemm_nt_t_sm50.cu rename to test/device/sm50_simt_minimum_multiplies_dsrgemm_nt_t.cu diff --git a/test/device/simt_minimum_multiplies_dsrgemm_tn_n_sm50.cu b/test/device/sm50_simt_minimum_multiplies_dsrgemm_tn_n.cu similarity index 100% rename from test/device/simt_minimum_multiplies_dsrgemm_tn_n_sm50.cu rename to test/device/sm50_simt_minimum_multiplies_dsrgemm_tn_n.cu diff --git a/test/device/simt_minimum_multiplies_dsrgemm_tn_t_sm50.cu b/test/device/sm50_simt_minimum_multiplies_dsrgemm_tn_t.cu similarity index 100% rename from test/device/simt_minimum_multiplies_dsrgemm_tn_t_sm50.cu rename to test/device/sm50_simt_minimum_multiplies_dsrgemm_tn_t.cu diff --git a/test/device/simt_minimum_multiplies_dsrgemm_tt_n_sm50.cu b/test/device/sm50_simt_minimum_multiplies_dsrgemm_tt_n.cu similarity index 100% rename from test/device/simt_minimum_multiplies_dsrgemm_tt_n_sm50.cu rename to test/device/sm50_simt_minimum_multiplies_dsrgemm_tt_n.cu diff --git a/test/device/simt_minimum_multiplies_dsrgemm_tt_t_sm50.cu b/test/device/sm50_simt_minimum_multiplies_dsrgemm_tt_t.cu similarity index 100% rename from test/device/simt_minimum_multiplies_dsrgemm_tt_t_sm50.cu rename to test/device/sm50_simt_minimum_multiplies_dsrgemm_tt_t.cu diff --git a/test/device/simt_minimum_multiplies_ssrgemm_nn_n_sm50.cu b/test/device/sm50_simt_minimum_multiplies_ssrgemm_nn_n.cu similarity index 100% 
rename from test/device/simt_minimum_multiplies_ssrgemm_nn_n_sm50.cu rename to test/device/sm50_simt_minimum_multiplies_ssrgemm_nn_n.cu diff --git a/test/device/simt_minimum_multiplies_ssrgemm_nn_t_sm50.cu b/test/device/sm50_simt_minimum_multiplies_ssrgemm_nn_t.cu similarity index 100% rename from test/device/simt_minimum_multiplies_ssrgemm_nn_t_sm50.cu rename to test/device/sm50_simt_minimum_multiplies_ssrgemm_nn_t.cu diff --git a/test/device/simt_minimum_multiplies_ssrgemm_nt_n_sm50.cu b/test/device/sm50_simt_minimum_multiplies_ssrgemm_nt_n.cu similarity index 100% rename from test/device/simt_minimum_multiplies_ssrgemm_nt_n_sm50.cu rename to test/device/sm50_simt_minimum_multiplies_ssrgemm_nt_n.cu diff --git a/test/device/simt_minimum_multiplies_ssrgemm_nt_t_sm50.cu b/test/device/sm50_simt_minimum_multiplies_ssrgemm_nt_t.cu similarity index 100% rename from test/device/simt_minimum_multiplies_ssrgemm_nt_t_sm50.cu rename to test/device/sm50_simt_minimum_multiplies_ssrgemm_nt_t.cu diff --git a/test/device/simt_minimum_multiplies_ssrgemm_tn_n_sm50.cu b/test/device/sm50_simt_minimum_multiplies_ssrgemm_tn_n.cu similarity index 100% rename from test/device/simt_minimum_multiplies_ssrgemm_tn_n_sm50.cu rename to test/device/sm50_simt_minimum_multiplies_ssrgemm_tn_n.cu diff --git a/test/device/simt_minimum_multiplies_ssrgemm_tn_t_sm50.cu b/test/device/sm50_simt_minimum_multiplies_ssrgemm_tn_t.cu similarity index 100% rename from test/device/simt_minimum_multiplies_ssrgemm_tn_t_sm50.cu rename to test/device/sm50_simt_minimum_multiplies_ssrgemm_tn_t.cu diff --git a/test/device/simt_minimum_multiplies_ssrgemm_tt_n_sm50.cu b/test/device/sm50_simt_minimum_multiplies_ssrgemm_tt_n.cu similarity index 100% rename from test/device/simt_minimum_multiplies_ssrgemm_tt_n_sm50.cu rename to test/device/sm50_simt_minimum_multiplies_ssrgemm_tt_n.cu diff --git a/test/device/simt_minimum_multiplies_ssrgemm_tt_t_sm50.cu b/test/device/sm50_simt_minimum_multiplies_ssrgemm_tt_t.cu similarity 
index 100% rename from test/device/simt_minimum_multiplies_ssrgemm_tt_t_sm50.cu rename to test/device/sm50_simt_minimum_multiplies_ssrgemm_tt_t.cu diff --git a/test/device/simt_minimum_plus_dsrgemm_nn_n_sm50.cu b/test/device/sm50_simt_minimum_plus_dsrgemm_nn_n.cu similarity index 100% rename from test/device/simt_minimum_plus_dsrgemm_nn_n_sm50.cu rename to test/device/sm50_simt_minimum_plus_dsrgemm_nn_n.cu diff --git a/test/device/simt_minimum_plus_dsrgemm_nn_t_sm50.cu b/test/device/sm50_simt_minimum_plus_dsrgemm_nn_t.cu similarity index 100% rename from test/device/simt_minimum_plus_dsrgemm_nn_t_sm50.cu rename to test/device/sm50_simt_minimum_plus_dsrgemm_nn_t.cu diff --git a/test/device/simt_minimum_plus_dsrgemm_nt_n_sm50.cu b/test/device/sm50_simt_minimum_plus_dsrgemm_nt_n.cu similarity index 100% rename from test/device/simt_minimum_plus_dsrgemm_nt_n_sm50.cu rename to test/device/sm50_simt_minimum_plus_dsrgemm_nt_n.cu diff --git a/test/device/simt_minimum_plus_dsrgemm_nt_t_sm50.cu b/test/device/sm50_simt_minimum_plus_dsrgemm_nt_t.cu similarity index 100% rename from test/device/simt_minimum_plus_dsrgemm_nt_t_sm50.cu rename to test/device/sm50_simt_minimum_plus_dsrgemm_nt_t.cu diff --git a/test/device/simt_minimum_plus_dsrgemm_tn_n_sm50.cu b/test/device/sm50_simt_minimum_plus_dsrgemm_tn_n.cu similarity index 100% rename from test/device/simt_minimum_plus_dsrgemm_tn_n_sm50.cu rename to test/device/sm50_simt_minimum_plus_dsrgemm_tn_n.cu diff --git a/test/device/simt_minimum_plus_dsrgemm_tn_t_sm50.cu b/test/device/sm50_simt_minimum_plus_dsrgemm_tn_t.cu similarity index 100% rename from test/device/simt_minimum_plus_dsrgemm_tn_t_sm50.cu rename to test/device/sm50_simt_minimum_plus_dsrgemm_tn_t.cu diff --git a/test/device/simt_minimum_plus_dsrgemm_tt_n_sm50.cu b/test/device/sm50_simt_minimum_plus_dsrgemm_tt_n.cu similarity index 100% rename from test/device/simt_minimum_plus_dsrgemm_tt_n_sm50.cu rename to test/device/sm50_simt_minimum_plus_dsrgemm_tt_n.cu diff --git 
a/test/device/simt_minimum_plus_dsrgemm_tt_t_sm50.cu b/test/device/sm50_simt_minimum_plus_dsrgemm_tt_t.cu similarity index 100% rename from test/device/simt_minimum_plus_dsrgemm_tt_t_sm50.cu rename to test/device/sm50_simt_minimum_plus_dsrgemm_tt_t.cu diff --git a/test/device/simt_minimum_plus_ssrgemm_nn_n_sm50.cu b/test/device/sm50_simt_minimum_plus_ssrgemm_nn_n.cu similarity index 100% rename from test/device/simt_minimum_plus_ssrgemm_nn_n_sm50.cu rename to test/device/sm50_simt_minimum_plus_ssrgemm_nn_n.cu diff --git a/test/device/simt_minimum_plus_ssrgemm_nn_t_sm50.cu b/test/device/sm50_simt_minimum_plus_ssrgemm_nn_t.cu similarity index 100% rename from test/device/simt_minimum_plus_ssrgemm_nn_t_sm50.cu rename to test/device/sm50_simt_minimum_plus_ssrgemm_nn_t.cu diff --git a/test/device/simt_minimum_plus_ssrgemm_nt_n_sm50.cu b/test/device/sm50_simt_minimum_plus_ssrgemm_nt_n.cu similarity index 100% rename from test/device/simt_minimum_plus_ssrgemm_nt_n_sm50.cu rename to test/device/sm50_simt_minimum_plus_ssrgemm_nt_n.cu diff --git a/test/device/simt_minimum_plus_ssrgemm_nt_t_sm50.cu b/test/device/sm50_simt_minimum_plus_ssrgemm_nt_t.cu similarity index 100% rename from test/device/simt_minimum_plus_ssrgemm_nt_t_sm50.cu rename to test/device/sm50_simt_minimum_plus_ssrgemm_nt_t.cu diff --git a/test/device/simt_minimum_plus_ssrgemm_tn_n_sm50.cu b/test/device/sm50_simt_minimum_plus_ssrgemm_tn_n.cu similarity index 100% rename from test/device/simt_minimum_plus_ssrgemm_tn_n_sm50.cu rename to test/device/sm50_simt_minimum_plus_ssrgemm_tn_n.cu diff --git a/test/device/simt_minimum_plus_ssrgemm_tn_t_sm50.cu b/test/device/sm50_simt_minimum_plus_ssrgemm_tn_t.cu similarity index 100% rename from test/device/simt_minimum_plus_ssrgemm_tn_t_sm50.cu rename to test/device/sm50_simt_minimum_plus_ssrgemm_tn_t.cu diff --git a/test/device/simt_minimum_plus_ssrgemm_tt_n_sm50.cu b/test/device/sm50_simt_minimum_plus_ssrgemm_tt_n.cu similarity index 100% rename from 
test/device/simt_minimum_plus_ssrgemm_tt_n_sm50.cu rename to test/device/sm50_simt_minimum_plus_ssrgemm_tt_n.cu diff --git a/test/device/simt_minimum_plus_ssrgemm_tt_t_sm50.cu b/test/device/sm50_simt_minimum_plus_ssrgemm_tt_t.cu similarity index 100% rename from test/device/simt_minimum_plus_ssrgemm_tt_t_sm50.cu rename to test/device/sm50_simt_minimum_plus_ssrgemm_tt_t.cu diff --git a/test/device/simt_plus_multiplies_dsrgemm_nn_n_sm50.cu b/test/device/sm50_simt_plus_multiplies_dsrgemm_nn_n.cu similarity index 100% rename from test/device/simt_plus_multiplies_dsrgemm_nn_n_sm50.cu rename to test/device/sm50_simt_plus_multiplies_dsrgemm_nn_n.cu diff --git a/test/device/simt_plus_multiplies_dsrgemm_nn_t_sm50.cu b/test/device/sm50_simt_plus_multiplies_dsrgemm_nn_t.cu similarity index 100% rename from test/device/simt_plus_multiplies_dsrgemm_nn_t_sm50.cu rename to test/device/sm50_simt_plus_multiplies_dsrgemm_nn_t.cu diff --git a/test/device/simt_plus_multiplies_dsrgemm_nt_n_sm50.cu b/test/device/sm50_simt_plus_multiplies_dsrgemm_nt_n.cu similarity index 100% rename from test/device/simt_plus_multiplies_dsrgemm_nt_n_sm50.cu rename to test/device/sm50_simt_plus_multiplies_dsrgemm_nt_n.cu diff --git a/test/device/simt_plus_multiplies_dsrgemm_nt_t_sm50.cu b/test/device/sm50_simt_plus_multiplies_dsrgemm_nt_t.cu similarity index 100% rename from test/device/simt_plus_multiplies_dsrgemm_nt_t_sm50.cu rename to test/device/sm50_simt_plus_multiplies_dsrgemm_nt_t.cu diff --git a/test/device/simt_plus_multiplies_dsrgemm_tn_n_sm50.cu b/test/device/sm50_simt_plus_multiplies_dsrgemm_tn_n.cu similarity index 100% rename from test/device/simt_plus_multiplies_dsrgemm_tn_n_sm50.cu rename to test/device/sm50_simt_plus_multiplies_dsrgemm_tn_n.cu diff --git a/test/device/simt_plus_multiplies_dsrgemm_tn_t_sm50.cu b/test/device/sm50_simt_plus_multiplies_dsrgemm_tn_t.cu similarity index 100% rename from test/device/simt_plus_multiplies_dsrgemm_tn_t_sm50.cu rename to 
test/device/sm50_simt_plus_multiplies_dsrgemm_tn_t.cu diff --git a/test/device/simt_plus_multiplies_dsrgemm_tt_n_sm50.cu b/test/device/sm50_simt_plus_multiplies_dsrgemm_tt_n.cu similarity index 100% rename from test/device/simt_plus_multiplies_dsrgemm_tt_n_sm50.cu rename to test/device/sm50_simt_plus_multiplies_dsrgemm_tt_n.cu diff --git a/test/device/simt_plus_multiplies_dsrgemm_tt_t_sm50.cu b/test/device/sm50_simt_plus_multiplies_dsrgemm_tt_t.cu similarity index 100% rename from test/device/simt_plus_multiplies_dsrgemm_tt_t_sm50.cu rename to test/device/sm50_simt_plus_multiplies_dsrgemm_tt_t.cu diff --git a/test/device/simt_plus_multiplies_ssrgemm_nn_n_sm50.cu b/test/device/sm50_simt_plus_multiplies_ssrgemm_nn_n.cu similarity index 100% rename from test/device/simt_plus_multiplies_ssrgemm_nn_n_sm50.cu rename to test/device/sm50_simt_plus_multiplies_ssrgemm_nn_n.cu diff --git a/test/device/simt_plus_multiplies_ssrgemm_nn_t_sm50.cu b/test/device/sm50_simt_plus_multiplies_ssrgemm_nn_t.cu similarity index 100% rename from test/device/simt_plus_multiplies_ssrgemm_nn_t_sm50.cu rename to test/device/sm50_simt_plus_multiplies_ssrgemm_nn_t.cu diff --git a/test/device/simt_plus_multiplies_ssrgemm_nt_n_sm50.cu b/test/device/sm50_simt_plus_multiplies_ssrgemm_nt_n.cu similarity index 100% rename from test/device/simt_plus_multiplies_ssrgemm_nt_n_sm50.cu rename to test/device/sm50_simt_plus_multiplies_ssrgemm_nt_n.cu diff --git a/test/device/simt_plus_multiplies_ssrgemm_nt_t_sm50.cu b/test/device/sm50_simt_plus_multiplies_ssrgemm_nt_t.cu similarity index 100% rename from test/device/simt_plus_multiplies_ssrgemm_nt_t_sm50.cu rename to test/device/sm50_simt_plus_multiplies_ssrgemm_nt_t.cu diff --git a/test/device/simt_plus_multiplies_ssrgemm_tn_n_sm50.cu b/test/device/sm50_simt_plus_multiplies_ssrgemm_tn_n.cu similarity index 100% rename from test/device/simt_plus_multiplies_ssrgemm_tn_n_sm50.cu rename to test/device/sm50_simt_plus_multiplies_ssrgemm_tn_n.cu diff --git 
a/test/device/simt_plus_multiplies_ssrgemm_tn_t_sm50.cu b/test/device/sm50_simt_plus_multiplies_ssrgemm_tn_t.cu similarity index 100% rename from test/device/simt_plus_multiplies_ssrgemm_tn_t_sm50.cu rename to test/device/sm50_simt_plus_multiplies_ssrgemm_tn_t.cu diff --git a/test/device/simt_plus_multiplies_ssrgemm_tt_n_sm50.cu b/test/device/sm50_simt_plus_multiplies_ssrgemm_tt_n.cu similarity index 100% rename from test/device/simt_plus_multiplies_ssrgemm_tt_n_sm50.cu rename to test/device/sm50_simt_plus_multiplies_ssrgemm_tt_n.cu diff --git a/test/device/simt_plus_multiplies_ssrgemm_tt_t_sm50.cu b/test/device/sm50_simt_plus_multiplies_ssrgemm_tt_t.cu similarity index 100% rename from test/device/simt_plus_multiplies_ssrgemm_tt_t_sm50.cu rename to test/device/sm50_simt_plus_multiplies_ssrgemm_tt_t.cu From 6b7fa2346302e5250e39157d55f37862dae8edea Mon Sep 17 00:00:00 2001 From: Void Date: Sun, 31 Oct 2021 09:18:23 -0400 Subject: [PATCH 06/15] generalize bench generator and rename bench files in prep for SM80 --- bench/device/{simt_sm50.py => gen_simt.py} | 34 ++++++++++++------- ...simt_binary_or_binary_and_dsrgemm_nn_n.cu} | 0 ...simt_binary_or_binary_and_dsrgemm_nn_t.cu} | 0 ...simt_binary_or_binary_and_dsrgemm_nt_n.cu} | 0 ...simt_binary_or_binary_and_dsrgemm_nt_t.cu} | 0 ...simt_binary_or_binary_and_dsrgemm_tn_n.cu} | 0 ...simt_binary_or_binary_and_dsrgemm_tn_t.cu} | 0 ...simt_binary_or_binary_and_dsrgemm_tt_n.cu} | 0 ...simt_binary_or_binary_and_dsrgemm_tt_t.cu} | 0 ...simt_binary_or_binary_and_ssrgemm_nn_n.cu} | 0 ...simt_binary_or_binary_and_ssrgemm_nn_t.cu} | 0 ...simt_binary_or_binary_and_ssrgemm_nt_n.cu} | 0 ...simt_binary_or_binary_and_ssrgemm_nt_t.cu} | 0 ...simt_binary_or_binary_and_ssrgemm_tn_n.cu} | 0 ...simt_binary_or_binary_and_ssrgemm_tn_t.cu} | 0 ...simt_binary_or_binary_and_ssrgemm_tt_n.cu} | 0 ...simt_binary_or_binary_and_ssrgemm_tt_t.cu} | 0 ...sm50_simt_maximum_minimum_dsrgemm_nn_n.cu} | 0 ...sm50_simt_maximum_minimum_dsrgemm_nn_t.cu} | 0 
...sm50_simt_maximum_minimum_dsrgemm_nt_n.cu} | 0 ...sm50_simt_maximum_minimum_dsrgemm_nt_t.cu} | 0 ...sm50_simt_maximum_minimum_dsrgemm_tn_n.cu} | 0 ...sm50_simt_maximum_minimum_dsrgemm_tn_t.cu} | 0 ...sm50_simt_maximum_minimum_dsrgemm_tt_n.cu} | 0 ...sm50_simt_maximum_minimum_dsrgemm_tt_t.cu} | 0 ...sm50_simt_maximum_minimum_ssrgemm_nn_n.cu} | 0 ...sm50_simt_maximum_minimum_ssrgemm_nn_t.cu} | 0 ...sm50_simt_maximum_minimum_ssrgemm_nt_n.cu} | 0 ...sm50_simt_maximum_minimum_ssrgemm_nt_t.cu} | 0 ...sm50_simt_maximum_minimum_ssrgemm_tn_n.cu} | 0 ...sm50_simt_maximum_minimum_ssrgemm_tn_t.cu} | 0 ...sm50_simt_maximum_minimum_ssrgemm_tt_n.cu} | 0 ...sm50_simt_maximum_minimum_ssrgemm_tt_t.cu} | 0 ...0_simt_maximum_multiplies_dsrgemm_nn_n.cu} | 0 ...0_simt_maximum_multiplies_dsrgemm_nn_t.cu} | 0 ...0_simt_maximum_multiplies_dsrgemm_nt_n.cu} | 0 ...0_simt_maximum_multiplies_dsrgemm_nt_t.cu} | 0 ...0_simt_maximum_multiplies_dsrgemm_tn_n.cu} | 0 ...0_simt_maximum_multiplies_dsrgemm_tn_t.cu} | 0 ...0_simt_maximum_multiplies_dsrgemm_tt_n.cu} | 0 ...0_simt_maximum_multiplies_dsrgemm_tt_t.cu} | 0 ...0_simt_maximum_multiplies_ssrgemm_nn_n.cu} | 0 ...0_simt_maximum_multiplies_ssrgemm_nn_t.cu} | 0 ...0_simt_maximum_multiplies_ssrgemm_nt_n.cu} | 0 ...0_simt_maximum_multiplies_ssrgemm_nt_t.cu} | 0 ...0_simt_maximum_multiplies_ssrgemm_tn_n.cu} | 0 ...0_simt_maximum_multiplies_ssrgemm_tn_t.cu} | 0 ...0_simt_maximum_multiplies_ssrgemm_tt_n.cu} | 0 ...0_simt_maximum_multiplies_ssrgemm_tt_t.cu} | 0 ...=> sm50_simt_maximum_plus_dsrgemm_nn_n.cu} | 0 ...=> sm50_simt_maximum_plus_dsrgemm_nn_t.cu} | 0 ...=> sm50_simt_maximum_plus_dsrgemm_nt_n.cu} | 0 ...=> sm50_simt_maximum_plus_dsrgemm_nt_t.cu} | 0 ...=> sm50_simt_maximum_plus_dsrgemm_tn_n.cu} | 0 ...=> sm50_simt_maximum_plus_dsrgemm_tn_t.cu} | 0 ...=> sm50_simt_maximum_plus_dsrgemm_tt_n.cu} | 0 ...=> sm50_simt_maximum_plus_dsrgemm_tt_t.cu} | 0 ...=> sm50_simt_maximum_plus_ssrgemm_nn_n.cu} | 0 ...=> sm50_simt_maximum_plus_ssrgemm_nn_t.cu} | 0 
...=> sm50_simt_maximum_plus_ssrgemm_nt_n.cu} | 0 ...=> sm50_simt_maximum_plus_ssrgemm_nt_t.cu} | 0 ...=> sm50_simt_maximum_plus_ssrgemm_tn_n.cu} | 0 ...=> sm50_simt_maximum_plus_ssrgemm_tn_t.cu} | 0 ...=> sm50_simt_maximum_plus_ssrgemm_tt_n.cu} | 0 ...=> sm50_simt_maximum_plus_ssrgemm_tt_t.cu} | 0 ...sm50_simt_minimum_maximum_dsrgemm_nn_n.cu} | 0 ...sm50_simt_minimum_maximum_dsrgemm_nn_t.cu} | 0 ...sm50_simt_minimum_maximum_dsrgemm_nt_n.cu} | 0 ...sm50_simt_minimum_maximum_dsrgemm_nt_t.cu} | 0 ...sm50_simt_minimum_maximum_dsrgemm_tn_n.cu} | 0 ...sm50_simt_minimum_maximum_dsrgemm_tn_t.cu} | 0 ...sm50_simt_minimum_maximum_dsrgemm_tt_n.cu} | 0 ...sm50_simt_minimum_maximum_dsrgemm_tt_t.cu} | 0 ...sm50_simt_minimum_maximum_ssrgemm_nn_n.cu} | 0 ...sm50_simt_minimum_maximum_ssrgemm_nn_t.cu} | 0 ...sm50_simt_minimum_maximum_ssrgemm_nt_n.cu} | 0 ...sm50_simt_minimum_maximum_ssrgemm_nt_t.cu} | 0 ...sm50_simt_minimum_maximum_ssrgemm_tn_n.cu} | 0 ...sm50_simt_minimum_maximum_ssrgemm_tn_t.cu} | 0 ...sm50_simt_minimum_maximum_ssrgemm_tt_n.cu} | 0 ...sm50_simt_minimum_maximum_ssrgemm_tt_t.cu} | 0 ...0_simt_minimum_multiplies_dsrgemm_nn_n.cu} | 0 ...0_simt_minimum_multiplies_dsrgemm_nn_t.cu} | 0 ...0_simt_minimum_multiplies_dsrgemm_nt_n.cu} | 0 ...0_simt_minimum_multiplies_dsrgemm_nt_t.cu} | 0 ...0_simt_minimum_multiplies_dsrgemm_tn_n.cu} | 0 ...0_simt_minimum_multiplies_dsrgemm_tn_t.cu} | 0 ...0_simt_minimum_multiplies_dsrgemm_tt_n.cu} | 0 ...0_simt_minimum_multiplies_dsrgemm_tt_t.cu} | 0 ...0_simt_minimum_multiplies_ssrgemm_nn_n.cu} | 0 ...0_simt_minimum_multiplies_ssrgemm_nn_t.cu} | 0 ...0_simt_minimum_multiplies_ssrgemm_nt_n.cu} | 0 ...0_simt_minimum_multiplies_ssrgemm_nt_t.cu} | 0 ...0_simt_minimum_multiplies_ssrgemm_tn_n.cu} | 0 ...0_simt_minimum_multiplies_ssrgemm_tn_t.cu} | 0 ...0_simt_minimum_multiplies_ssrgemm_tt_n.cu} | 0 ...0_simt_minimum_multiplies_ssrgemm_tt_t.cu} | 0 ...=> sm50_simt_minimum_plus_dsrgemm_nn_n.cu} | 0 ...=> sm50_simt_minimum_plus_dsrgemm_nn_t.cu} | 0 
...=> sm50_simt_minimum_plus_dsrgemm_nt_n.cu} | 0 ...=> sm50_simt_minimum_plus_dsrgemm_nt_t.cu} | 0 ...=> sm50_simt_minimum_plus_dsrgemm_tn_n.cu} | 0 ...=> sm50_simt_minimum_plus_dsrgemm_tn_t.cu} | 0 ...=> sm50_simt_minimum_plus_dsrgemm_tt_n.cu} | 0 ...=> sm50_simt_minimum_plus_dsrgemm_tt_t.cu} | 0 ...=> sm50_simt_minimum_plus_ssrgemm_nn_n.cu} | 0 ...=> sm50_simt_minimum_plus_ssrgemm_nn_t.cu} | 0 ...=> sm50_simt_minimum_plus_ssrgemm_nt_n.cu} | 0 ...=> sm50_simt_minimum_plus_ssrgemm_nt_t.cu} | 0 ...=> sm50_simt_minimum_plus_ssrgemm_tn_n.cu} | 0 ...=> sm50_simt_minimum_plus_ssrgemm_tn_t.cu} | 0 ...=> sm50_simt_minimum_plus_ssrgemm_tt_n.cu} | 0 ...=> sm50_simt_minimum_plus_ssrgemm_tt_t.cu} | 0 ...sm50_simt_plus_multiplies_dsrgemm_nn_n.cu} | 0 ...sm50_simt_plus_multiplies_dsrgemm_nn_t.cu} | 0 ...sm50_simt_plus_multiplies_dsrgemm_nt_n.cu} | 0 ...sm50_simt_plus_multiplies_dsrgemm_nt_t.cu} | 0 ...sm50_simt_plus_multiplies_dsrgemm_tn_n.cu} | 0 ...sm50_simt_plus_multiplies_dsrgemm_tn_t.cu} | 0 ...sm50_simt_plus_multiplies_dsrgemm_tt_n.cu} | 0 ...sm50_simt_plus_multiplies_dsrgemm_tt_t.cu} | 0 ...sm50_simt_plus_multiplies_ssrgemm_nn_n.cu} | 0 ...sm50_simt_plus_multiplies_ssrgemm_nn_t.cu} | 0 ...sm50_simt_plus_multiplies_ssrgemm_nt_n.cu} | 0 ...sm50_simt_plus_multiplies_ssrgemm_nt_t.cu} | 0 ...sm50_simt_plus_multiplies_ssrgemm_tn_n.cu} | 0 ...sm50_simt_plus_multiplies_ssrgemm_tn_t.cu} | 0 ...sm50_simt_plus_multiplies_ssrgemm_tt_n.cu} | 0 ...sm50_simt_plus_multiplies_ssrgemm_tt_t.cu} | 0 129 files changed, 22 insertions(+), 12 deletions(-) rename bench/device/{simt_sm50.py => gen_simt.py} (92%) rename bench/device/{simt_binary_or_binary_and_dsrgemm_nn_n_sm50.cu => sm50_simt_binary_or_binary_and_dsrgemm_nn_n.cu} (100%) rename bench/device/{simt_binary_or_binary_and_dsrgemm_nn_t_sm50.cu => sm50_simt_binary_or_binary_and_dsrgemm_nn_t.cu} (100%) rename bench/device/{simt_binary_or_binary_and_dsrgemm_nt_n_sm50.cu => sm50_simt_binary_or_binary_and_dsrgemm_nt_n.cu} (100%) rename 
bench/device/{simt_binary_or_binary_and_dsrgemm_nt_t_sm50.cu => sm50_simt_binary_or_binary_and_dsrgemm_nt_t.cu} (100%) rename bench/device/{simt_binary_or_binary_and_dsrgemm_tn_n_sm50.cu => sm50_simt_binary_or_binary_and_dsrgemm_tn_n.cu} (100%) rename bench/device/{simt_binary_or_binary_and_dsrgemm_tn_t_sm50.cu => sm50_simt_binary_or_binary_and_dsrgemm_tn_t.cu} (100%) rename bench/device/{simt_binary_or_binary_and_dsrgemm_tt_n_sm50.cu => sm50_simt_binary_or_binary_and_dsrgemm_tt_n.cu} (100%) rename bench/device/{simt_binary_or_binary_and_dsrgemm_tt_t_sm50.cu => sm50_simt_binary_or_binary_and_dsrgemm_tt_t.cu} (100%) rename bench/device/{simt_binary_or_binary_and_ssrgemm_nn_n_sm50.cu => sm50_simt_binary_or_binary_and_ssrgemm_nn_n.cu} (100%) rename bench/device/{simt_binary_or_binary_and_ssrgemm_nn_t_sm50.cu => sm50_simt_binary_or_binary_and_ssrgemm_nn_t.cu} (100%) rename bench/device/{simt_binary_or_binary_and_ssrgemm_nt_n_sm50.cu => sm50_simt_binary_or_binary_and_ssrgemm_nt_n.cu} (100%) rename bench/device/{simt_binary_or_binary_and_ssrgemm_nt_t_sm50.cu => sm50_simt_binary_or_binary_and_ssrgemm_nt_t.cu} (100%) rename bench/device/{simt_binary_or_binary_and_ssrgemm_tn_n_sm50.cu => sm50_simt_binary_or_binary_and_ssrgemm_tn_n.cu} (100%) rename bench/device/{simt_binary_or_binary_and_ssrgemm_tn_t_sm50.cu => sm50_simt_binary_or_binary_and_ssrgemm_tn_t.cu} (100%) rename bench/device/{simt_binary_or_binary_and_ssrgemm_tt_n_sm50.cu => sm50_simt_binary_or_binary_and_ssrgemm_tt_n.cu} (100%) rename bench/device/{simt_binary_or_binary_and_ssrgemm_tt_t_sm50.cu => sm50_simt_binary_or_binary_and_ssrgemm_tt_t.cu} (100%) rename bench/device/{simt_maximum_minimum_dsrgemm_nn_n_sm50.cu => sm50_simt_maximum_minimum_dsrgemm_nn_n.cu} (100%) rename bench/device/{simt_maximum_minimum_dsrgemm_nn_t_sm50.cu => sm50_simt_maximum_minimum_dsrgemm_nn_t.cu} (100%) rename bench/device/{simt_maximum_minimum_dsrgemm_nt_n_sm50.cu => sm50_simt_maximum_minimum_dsrgemm_nt_n.cu} (100%) rename 
bench/device/{simt_maximum_minimum_dsrgemm_nt_t_sm50.cu => sm50_simt_maximum_minimum_dsrgemm_nt_t.cu} (100%) rename bench/device/{simt_maximum_minimum_dsrgemm_tn_n_sm50.cu => sm50_simt_maximum_minimum_dsrgemm_tn_n.cu} (100%) rename bench/device/{simt_maximum_minimum_dsrgemm_tn_t_sm50.cu => sm50_simt_maximum_minimum_dsrgemm_tn_t.cu} (100%) rename bench/device/{simt_maximum_minimum_dsrgemm_tt_n_sm50.cu => sm50_simt_maximum_minimum_dsrgemm_tt_n.cu} (100%) rename bench/device/{simt_maximum_minimum_dsrgemm_tt_t_sm50.cu => sm50_simt_maximum_minimum_dsrgemm_tt_t.cu} (100%) rename bench/device/{simt_maximum_minimum_ssrgemm_nn_n_sm50.cu => sm50_simt_maximum_minimum_ssrgemm_nn_n.cu} (100%) rename bench/device/{simt_maximum_minimum_ssrgemm_nn_t_sm50.cu => sm50_simt_maximum_minimum_ssrgemm_nn_t.cu} (100%) rename bench/device/{simt_maximum_minimum_ssrgemm_nt_n_sm50.cu => sm50_simt_maximum_minimum_ssrgemm_nt_n.cu} (100%) rename bench/device/{simt_maximum_minimum_ssrgemm_nt_t_sm50.cu => sm50_simt_maximum_minimum_ssrgemm_nt_t.cu} (100%) rename bench/device/{simt_maximum_minimum_ssrgemm_tn_n_sm50.cu => sm50_simt_maximum_minimum_ssrgemm_tn_n.cu} (100%) rename bench/device/{simt_maximum_minimum_ssrgemm_tn_t_sm50.cu => sm50_simt_maximum_minimum_ssrgemm_tn_t.cu} (100%) rename bench/device/{simt_maximum_minimum_ssrgemm_tt_n_sm50.cu => sm50_simt_maximum_minimum_ssrgemm_tt_n.cu} (100%) rename bench/device/{simt_maximum_minimum_ssrgemm_tt_t_sm50.cu => sm50_simt_maximum_minimum_ssrgemm_tt_t.cu} (100%) rename bench/device/{simt_maximum_multiplies_dsrgemm_nn_n_sm50.cu => sm50_simt_maximum_multiplies_dsrgemm_nn_n.cu} (100%) rename bench/device/{simt_maximum_multiplies_dsrgemm_nn_t_sm50.cu => sm50_simt_maximum_multiplies_dsrgemm_nn_t.cu} (100%) rename bench/device/{simt_maximum_multiplies_dsrgemm_nt_n_sm50.cu => sm50_simt_maximum_multiplies_dsrgemm_nt_n.cu} (100%) rename bench/device/{simt_maximum_multiplies_dsrgemm_nt_t_sm50.cu => sm50_simt_maximum_multiplies_dsrgemm_nt_t.cu} (100%) rename 
bench/device/{simt_maximum_multiplies_dsrgemm_tn_n_sm50.cu => sm50_simt_maximum_multiplies_dsrgemm_tn_n.cu} (100%) rename bench/device/{simt_maximum_multiplies_dsrgemm_tn_t_sm50.cu => sm50_simt_maximum_multiplies_dsrgemm_tn_t.cu} (100%) rename bench/device/{simt_maximum_multiplies_dsrgemm_tt_n_sm50.cu => sm50_simt_maximum_multiplies_dsrgemm_tt_n.cu} (100%) rename bench/device/{simt_maximum_multiplies_dsrgemm_tt_t_sm50.cu => sm50_simt_maximum_multiplies_dsrgemm_tt_t.cu} (100%) rename bench/device/{simt_maximum_multiplies_ssrgemm_nn_n_sm50.cu => sm50_simt_maximum_multiplies_ssrgemm_nn_n.cu} (100%) rename bench/device/{simt_maximum_multiplies_ssrgemm_nn_t_sm50.cu => sm50_simt_maximum_multiplies_ssrgemm_nn_t.cu} (100%) rename bench/device/{simt_maximum_multiplies_ssrgemm_nt_n_sm50.cu => sm50_simt_maximum_multiplies_ssrgemm_nt_n.cu} (100%) rename bench/device/{simt_maximum_multiplies_ssrgemm_nt_t_sm50.cu => sm50_simt_maximum_multiplies_ssrgemm_nt_t.cu} (100%) rename bench/device/{simt_maximum_multiplies_ssrgemm_tn_n_sm50.cu => sm50_simt_maximum_multiplies_ssrgemm_tn_n.cu} (100%) rename bench/device/{simt_maximum_multiplies_ssrgemm_tn_t_sm50.cu => sm50_simt_maximum_multiplies_ssrgemm_tn_t.cu} (100%) rename bench/device/{simt_maximum_multiplies_ssrgemm_tt_n_sm50.cu => sm50_simt_maximum_multiplies_ssrgemm_tt_n.cu} (100%) rename bench/device/{simt_maximum_multiplies_ssrgemm_tt_t_sm50.cu => sm50_simt_maximum_multiplies_ssrgemm_tt_t.cu} (100%) rename bench/device/{simt_maximum_plus_dsrgemm_nn_n_sm50.cu => sm50_simt_maximum_plus_dsrgemm_nn_n.cu} (100%) rename bench/device/{simt_maximum_plus_dsrgemm_nn_t_sm50.cu => sm50_simt_maximum_plus_dsrgemm_nn_t.cu} (100%) rename bench/device/{simt_maximum_plus_dsrgemm_nt_n_sm50.cu => sm50_simt_maximum_plus_dsrgemm_nt_n.cu} (100%) rename bench/device/{simt_maximum_plus_dsrgemm_nt_t_sm50.cu => sm50_simt_maximum_plus_dsrgemm_nt_t.cu} (100%) rename bench/device/{simt_maximum_plus_dsrgemm_tn_n_sm50.cu => sm50_simt_maximum_plus_dsrgemm_tn_n.cu} 
(100%) rename bench/device/{simt_maximum_plus_dsrgemm_tn_t_sm50.cu => sm50_simt_maximum_plus_dsrgemm_tn_t.cu} (100%) rename bench/device/{simt_maximum_plus_dsrgemm_tt_n_sm50.cu => sm50_simt_maximum_plus_dsrgemm_tt_n.cu} (100%) rename bench/device/{simt_maximum_plus_dsrgemm_tt_t_sm50.cu => sm50_simt_maximum_plus_dsrgemm_tt_t.cu} (100%) rename bench/device/{simt_maximum_plus_ssrgemm_nn_n_sm50.cu => sm50_simt_maximum_plus_ssrgemm_nn_n.cu} (100%) rename bench/device/{simt_maximum_plus_ssrgemm_nn_t_sm50.cu => sm50_simt_maximum_plus_ssrgemm_nn_t.cu} (100%) rename bench/device/{simt_maximum_plus_ssrgemm_nt_n_sm50.cu => sm50_simt_maximum_plus_ssrgemm_nt_n.cu} (100%) rename bench/device/{simt_maximum_plus_ssrgemm_nt_t_sm50.cu => sm50_simt_maximum_plus_ssrgemm_nt_t.cu} (100%) rename bench/device/{simt_maximum_plus_ssrgemm_tn_n_sm50.cu => sm50_simt_maximum_plus_ssrgemm_tn_n.cu} (100%) rename bench/device/{simt_maximum_plus_ssrgemm_tn_t_sm50.cu => sm50_simt_maximum_plus_ssrgemm_tn_t.cu} (100%) rename bench/device/{simt_maximum_plus_ssrgemm_tt_n_sm50.cu => sm50_simt_maximum_plus_ssrgemm_tt_n.cu} (100%) rename bench/device/{simt_maximum_plus_ssrgemm_tt_t_sm50.cu => sm50_simt_maximum_plus_ssrgemm_tt_t.cu} (100%) rename bench/device/{simt_minimum_maximum_dsrgemm_nn_n_sm50.cu => sm50_simt_minimum_maximum_dsrgemm_nn_n.cu} (100%) rename bench/device/{simt_minimum_maximum_dsrgemm_nn_t_sm50.cu => sm50_simt_minimum_maximum_dsrgemm_nn_t.cu} (100%) rename bench/device/{simt_minimum_maximum_dsrgemm_nt_n_sm50.cu => sm50_simt_minimum_maximum_dsrgemm_nt_n.cu} (100%) rename bench/device/{simt_minimum_maximum_dsrgemm_nt_t_sm50.cu => sm50_simt_minimum_maximum_dsrgemm_nt_t.cu} (100%) rename bench/device/{simt_minimum_maximum_dsrgemm_tn_n_sm50.cu => sm50_simt_minimum_maximum_dsrgemm_tn_n.cu} (100%) rename bench/device/{simt_minimum_maximum_dsrgemm_tn_t_sm50.cu => sm50_simt_minimum_maximum_dsrgemm_tn_t.cu} (100%) rename bench/device/{simt_minimum_maximum_dsrgemm_tt_n_sm50.cu => 
sm50_simt_minimum_maximum_dsrgemm_tt_n.cu} (100%) rename bench/device/{simt_minimum_maximum_dsrgemm_tt_t_sm50.cu => sm50_simt_minimum_maximum_dsrgemm_tt_t.cu} (100%) rename bench/device/{simt_minimum_maximum_ssrgemm_nn_n_sm50.cu => sm50_simt_minimum_maximum_ssrgemm_nn_n.cu} (100%) rename bench/device/{simt_minimum_maximum_ssrgemm_nn_t_sm50.cu => sm50_simt_minimum_maximum_ssrgemm_nn_t.cu} (100%) rename bench/device/{simt_minimum_maximum_ssrgemm_nt_n_sm50.cu => sm50_simt_minimum_maximum_ssrgemm_nt_n.cu} (100%) rename bench/device/{simt_minimum_maximum_ssrgemm_nt_t_sm50.cu => sm50_simt_minimum_maximum_ssrgemm_nt_t.cu} (100%) rename bench/device/{simt_minimum_maximum_ssrgemm_tn_n_sm50.cu => sm50_simt_minimum_maximum_ssrgemm_tn_n.cu} (100%) rename bench/device/{simt_minimum_maximum_ssrgemm_tn_t_sm50.cu => sm50_simt_minimum_maximum_ssrgemm_tn_t.cu} (100%) rename bench/device/{simt_minimum_maximum_ssrgemm_tt_n_sm50.cu => sm50_simt_minimum_maximum_ssrgemm_tt_n.cu} (100%) rename bench/device/{simt_minimum_maximum_ssrgemm_tt_t_sm50.cu => sm50_simt_minimum_maximum_ssrgemm_tt_t.cu} (100%) rename bench/device/{simt_minimum_multiplies_dsrgemm_nn_n_sm50.cu => sm50_simt_minimum_multiplies_dsrgemm_nn_n.cu} (100%) rename bench/device/{simt_minimum_multiplies_dsrgemm_nn_t_sm50.cu => sm50_simt_minimum_multiplies_dsrgemm_nn_t.cu} (100%) rename bench/device/{simt_minimum_multiplies_dsrgemm_nt_n_sm50.cu => sm50_simt_minimum_multiplies_dsrgemm_nt_n.cu} (100%) rename bench/device/{simt_minimum_multiplies_dsrgemm_nt_t_sm50.cu => sm50_simt_minimum_multiplies_dsrgemm_nt_t.cu} (100%) rename bench/device/{simt_minimum_multiplies_dsrgemm_tn_n_sm50.cu => sm50_simt_minimum_multiplies_dsrgemm_tn_n.cu} (100%) rename bench/device/{simt_minimum_multiplies_dsrgemm_tn_t_sm50.cu => sm50_simt_minimum_multiplies_dsrgemm_tn_t.cu} (100%) rename bench/device/{simt_minimum_multiplies_dsrgemm_tt_n_sm50.cu => sm50_simt_minimum_multiplies_dsrgemm_tt_n.cu} (100%) rename 
bench/device/{simt_minimum_multiplies_dsrgemm_tt_t_sm50.cu => sm50_simt_minimum_multiplies_dsrgemm_tt_t.cu} (100%) rename bench/device/{simt_minimum_multiplies_ssrgemm_nn_n_sm50.cu => sm50_simt_minimum_multiplies_ssrgemm_nn_n.cu} (100%) rename bench/device/{simt_minimum_multiplies_ssrgemm_nn_t_sm50.cu => sm50_simt_minimum_multiplies_ssrgemm_nn_t.cu} (100%) rename bench/device/{simt_minimum_multiplies_ssrgemm_nt_n_sm50.cu => sm50_simt_minimum_multiplies_ssrgemm_nt_n.cu} (100%) rename bench/device/{simt_minimum_multiplies_ssrgemm_nt_t_sm50.cu => sm50_simt_minimum_multiplies_ssrgemm_nt_t.cu} (100%) rename bench/device/{simt_minimum_multiplies_ssrgemm_tn_n_sm50.cu => sm50_simt_minimum_multiplies_ssrgemm_tn_n.cu} (100%) rename bench/device/{simt_minimum_multiplies_ssrgemm_tn_t_sm50.cu => sm50_simt_minimum_multiplies_ssrgemm_tn_t.cu} (100%) rename bench/device/{simt_minimum_multiplies_ssrgemm_tt_n_sm50.cu => sm50_simt_minimum_multiplies_ssrgemm_tt_n.cu} (100%) rename bench/device/{simt_minimum_multiplies_ssrgemm_tt_t_sm50.cu => sm50_simt_minimum_multiplies_ssrgemm_tt_t.cu} (100%) rename bench/device/{simt_minimum_plus_dsrgemm_nn_n_sm50.cu => sm50_simt_minimum_plus_dsrgemm_nn_n.cu} (100%) rename bench/device/{simt_minimum_plus_dsrgemm_nn_t_sm50.cu => sm50_simt_minimum_plus_dsrgemm_nn_t.cu} (100%) rename bench/device/{simt_minimum_plus_dsrgemm_nt_n_sm50.cu => sm50_simt_minimum_plus_dsrgemm_nt_n.cu} (100%) rename bench/device/{simt_minimum_plus_dsrgemm_nt_t_sm50.cu => sm50_simt_minimum_plus_dsrgemm_nt_t.cu} (100%) rename bench/device/{simt_minimum_plus_dsrgemm_tn_n_sm50.cu => sm50_simt_minimum_plus_dsrgemm_tn_n.cu} (100%) rename bench/device/{simt_minimum_plus_dsrgemm_tn_t_sm50.cu => sm50_simt_minimum_plus_dsrgemm_tn_t.cu} (100%) rename bench/device/{simt_minimum_plus_dsrgemm_tt_n_sm50.cu => sm50_simt_minimum_plus_dsrgemm_tt_n.cu} (100%) rename bench/device/{simt_minimum_plus_dsrgemm_tt_t_sm50.cu => sm50_simt_minimum_plus_dsrgemm_tt_t.cu} (100%) rename 
bench/device/{simt_minimum_plus_ssrgemm_nn_n_sm50.cu => sm50_simt_minimum_plus_ssrgemm_nn_n.cu} (100%) rename bench/device/{simt_minimum_plus_ssrgemm_nn_t_sm50.cu => sm50_simt_minimum_plus_ssrgemm_nn_t.cu} (100%) rename bench/device/{simt_minimum_plus_ssrgemm_nt_n_sm50.cu => sm50_simt_minimum_plus_ssrgemm_nt_n.cu} (100%) rename bench/device/{simt_minimum_plus_ssrgemm_nt_t_sm50.cu => sm50_simt_minimum_plus_ssrgemm_nt_t.cu} (100%) rename bench/device/{simt_minimum_plus_ssrgemm_tn_n_sm50.cu => sm50_simt_minimum_plus_ssrgemm_tn_n.cu} (100%) rename bench/device/{simt_minimum_plus_ssrgemm_tn_t_sm50.cu => sm50_simt_minimum_plus_ssrgemm_tn_t.cu} (100%) rename bench/device/{simt_minimum_plus_ssrgemm_tt_n_sm50.cu => sm50_simt_minimum_plus_ssrgemm_tt_n.cu} (100%) rename bench/device/{simt_minimum_plus_ssrgemm_tt_t_sm50.cu => sm50_simt_minimum_plus_ssrgemm_tt_t.cu} (100%) rename bench/device/{simt_plus_multiplies_dsrgemm_nn_n_sm50.cu => sm50_simt_plus_multiplies_dsrgemm_nn_n.cu} (100%) rename bench/device/{simt_plus_multiplies_dsrgemm_nn_t_sm50.cu => sm50_simt_plus_multiplies_dsrgemm_nn_t.cu} (100%) rename bench/device/{simt_plus_multiplies_dsrgemm_nt_n_sm50.cu => sm50_simt_plus_multiplies_dsrgemm_nt_n.cu} (100%) rename bench/device/{simt_plus_multiplies_dsrgemm_nt_t_sm50.cu => sm50_simt_plus_multiplies_dsrgemm_nt_t.cu} (100%) rename bench/device/{simt_plus_multiplies_dsrgemm_tn_n_sm50.cu => sm50_simt_plus_multiplies_dsrgemm_tn_n.cu} (100%) rename bench/device/{simt_plus_multiplies_dsrgemm_tn_t_sm50.cu => sm50_simt_plus_multiplies_dsrgemm_tn_t.cu} (100%) rename bench/device/{simt_plus_multiplies_dsrgemm_tt_n_sm50.cu => sm50_simt_plus_multiplies_dsrgemm_tt_n.cu} (100%) rename bench/device/{simt_plus_multiplies_dsrgemm_tt_t_sm50.cu => sm50_simt_plus_multiplies_dsrgemm_tt_t.cu} (100%) rename bench/device/{simt_plus_multiplies_ssrgemm_nn_n_sm50.cu => sm50_simt_plus_multiplies_ssrgemm_nn_n.cu} (100%) rename bench/device/{simt_plus_multiplies_ssrgemm_nn_t_sm50.cu => 
sm50_simt_plus_multiplies_ssrgemm_nn_t.cu} (100%) rename bench/device/{simt_plus_multiplies_ssrgemm_nt_n_sm50.cu => sm50_simt_plus_multiplies_ssrgemm_nt_n.cu} (100%) rename bench/device/{simt_plus_multiplies_ssrgemm_nt_t_sm50.cu => sm50_simt_plus_multiplies_ssrgemm_nt_t.cu} (100%) rename bench/device/{simt_plus_multiplies_ssrgemm_tn_n_sm50.cu => sm50_simt_plus_multiplies_ssrgemm_tn_n.cu} (100%) rename bench/device/{simt_plus_multiplies_ssrgemm_tn_t_sm50.cu => sm50_simt_plus_multiplies_ssrgemm_tn_t.cu} (100%) rename bench/device/{simt_plus_multiplies_ssrgemm_tt_n_sm50.cu => sm50_simt_plus_multiplies_ssrgemm_tt_n.cu} (100%) rename bench/device/{simt_plus_multiplies_ssrgemm_tt_t_sm50.cu => sm50_simt_plus_multiplies_ssrgemm_tt_t.cu} (100%) diff --git a/bench/device/simt_sm50.py b/bench/device/gen_simt.py similarity index 92% rename from bench/device/simt_sm50.py rename to bench/device/gen_simt.py index bfe6065..6e884c8 100644 --- a/bench/device/simt_sm50.py +++ b/bench/device/gen_simt.py @@ -1,4 +1,6 @@ import os +import sys +import argparse # this file creates the bench/unit/gemm/device simt benchmarks and the CMake file to go with it ################################################################################ @@ -83,11 +85,11 @@ bench_template = """\ #if defined(CUASR_BENCH_LEVEL) and (CUASR_BENCH_LEVEL >= {21}) -static void BM_SM50_device_{0}_{1}_{2}srgemm_{4}{5}_{6}_{10}x{11}x{12}_{13}x{14}x1_{15}x{16}_{17}x{18}_{19}x{20}(benchmark::State &state) {{ +static void BM_SM{22}_device_{0}_{1}_{2}srgemm_{4}{5}_{6}_{10}x{11}x{12}_{13}x{14}x1_{15}x{16}_{17}x{18}_{19}x{20}(benchmark::State &state) {{ const auto N = static_cast(state.range(0)); using precision = {3}; using OpClass = cutlass::arch::OpClassSimt; - using SmArch = cutlass::arch::Sm50; + using SmArch = cutlass::arch::Sm{22}; using ThreadblockShape = cutlass::gemm::GemmShape<{10}, {11}, {12}>; using WarpShape = cutlass::gemm::GemmShape<{13}, {14}, {12}>; @@ -123,7 +125,7 @@ state.counters["Flop/s"] = 
benchmark::Counter(flops_per_itr, benchmark::Counter::kIsIterationInvariantRate); }} -BENCHMARK(BM_SM50_device_{0}_{1}_{2}srgemm_{4}{5}_{6}_{10}x{11}x{12}_{13}x{14}x1_{15}x{16}_{17}x{18}_{19}x{20}) +BENCHMARK(BM_SM{22}_device_{0}_{1}_{2}srgemm_{4}{5}_{6}_{10}x{11}x{12}_{13}x{14}x1_{15}x{16}_{17}x{18}_{19}x{20}) ->RangeMultiplier(2)->Range(256, 4096); #endif @@ -151,7 +153,8 @@ def write_benchmark_to_file( warp_threadsM, warp_threadsN, warps_per_tb, - bench_level): + bench_level, + sm_arch): print("{:.0f}x{:.0f}x{:.0f}__{:.0f}x{:.0f}_{:.0f}x{:.0f}_{:.0f}x{:.0f}".format( threadblock_tile[0], threadblock_tile[1], unroll, thread_tileM, thread_tileN, @@ -191,11 +194,12 @@ def write_benchmark_to_file( int(warp_threadsN), # 18 int(warps_per_tb[0]), # 19 int(warps_per_tb[1]), # 20 - int(bench_level) # 21 + int(bench_level), # 21 + int(sm_arch) # 22 )) -def main(output_dir: str): +def main(args): # warps per threadblock warps_per_threadblocks = [] for warps_per_tb0 in WARPS_PER_TB_EDGE: @@ -247,12 +251,12 @@ def main(output_dir: str): transC = "n" if column_major_C else "t" # open file - benchfile_name = "simt_{}_{}_{}srgemm_{}{}_{}_sm50.cu".format( - add_op, mult_op, precision_char, + benchfile_name = "sm{}_simt_{}_{}_{}srgemm_{}{}_{}.cu".format( + args.sm_arch, add_op, mult_op, precision_char, transA, transB, transC) print("\n", benchfile_name) - filePath = os.path.join(output_dir, benchfile_name) + filePath = os.path.join(args.output_dir, benchfile_name) with open(filePath, "w") as benchfile: write_benchmark_file_header(benchfile) @@ -367,12 +371,18 @@ def main(output_dir: str): warp_threadsM, warp_threadsN, warps_per_tb, - bench_level) + bench_level, + args.sm_arch) num_benches += 1 print("Benchmarks per level = {}, {}, {}".format(benchcount_L0, benchcount_L1, benchcount_L2)) print("Total bench count per semi-ring = {}".format(num_benches // len(semiring_operators))) - if __name__ == "__main__": - main(".") + parser = argparse.ArgumentParser() + 
parser.add_argument("-o", "--output-dir", type=str, required=False, default=".", + help="Path to the output dir.") + parser.add_argument("-sm", "--sm-arch", type=int, required=False, default=50, choices=[50, 80], + help="SM architecture version number,") + args = parser.parse_args(sys.argv[1:]) + main(args) diff --git a/bench/device/simt_binary_or_binary_and_dsrgemm_nn_n_sm50.cu b/bench/device/sm50_simt_binary_or_binary_and_dsrgemm_nn_n.cu similarity index 100% rename from bench/device/simt_binary_or_binary_and_dsrgemm_nn_n_sm50.cu rename to bench/device/sm50_simt_binary_or_binary_and_dsrgemm_nn_n.cu diff --git a/bench/device/simt_binary_or_binary_and_dsrgemm_nn_t_sm50.cu b/bench/device/sm50_simt_binary_or_binary_and_dsrgemm_nn_t.cu similarity index 100% rename from bench/device/simt_binary_or_binary_and_dsrgemm_nn_t_sm50.cu rename to bench/device/sm50_simt_binary_or_binary_and_dsrgemm_nn_t.cu diff --git a/bench/device/simt_binary_or_binary_and_dsrgemm_nt_n_sm50.cu b/bench/device/sm50_simt_binary_or_binary_and_dsrgemm_nt_n.cu similarity index 100% rename from bench/device/simt_binary_or_binary_and_dsrgemm_nt_n_sm50.cu rename to bench/device/sm50_simt_binary_or_binary_and_dsrgemm_nt_n.cu diff --git a/bench/device/simt_binary_or_binary_and_dsrgemm_nt_t_sm50.cu b/bench/device/sm50_simt_binary_or_binary_and_dsrgemm_nt_t.cu similarity index 100% rename from bench/device/simt_binary_or_binary_and_dsrgemm_nt_t_sm50.cu rename to bench/device/sm50_simt_binary_or_binary_and_dsrgemm_nt_t.cu diff --git a/bench/device/simt_binary_or_binary_and_dsrgemm_tn_n_sm50.cu b/bench/device/sm50_simt_binary_or_binary_and_dsrgemm_tn_n.cu similarity index 100% rename from bench/device/simt_binary_or_binary_and_dsrgemm_tn_n_sm50.cu rename to bench/device/sm50_simt_binary_or_binary_and_dsrgemm_tn_n.cu diff --git a/bench/device/simt_binary_or_binary_and_dsrgemm_tn_t_sm50.cu b/bench/device/sm50_simt_binary_or_binary_and_dsrgemm_tn_t.cu similarity index 100% rename from 
bench/device/simt_binary_or_binary_and_dsrgemm_tn_t_sm50.cu rename to bench/device/sm50_simt_binary_or_binary_and_dsrgemm_tn_t.cu diff --git a/bench/device/simt_binary_or_binary_and_dsrgemm_tt_n_sm50.cu b/bench/device/sm50_simt_binary_or_binary_and_dsrgemm_tt_n.cu similarity index 100% rename from bench/device/simt_binary_or_binary_and_dsrgemm_tt_n_sm50.cu rename to bench/device/sm50_simt_binary_or_binary_and_dsrgemm_tt_n.cu diff --git a/bench/device/simt_binary_or_binary_and_dsrgemm_tt_t_sm50.cu b/bench/device/sm50_simt_binary_or_binary_and_dsrgemm_tt_t.cu similarity index 100% rename from bench/device/simt_binary_or_binary_and_dsrgemm_tt_t_sm50.cu rename to bench/device/sm50_simt_binary_or_binary_and_dsrgemm_tt_t.cu diff --git a/bench/device/simt_binary_or_binary_and_ssrgemm_nn_n_sm50.cu b/bench/device/sm50_simt_binary_or_binary_and_ssrgemm_nn_n.cu similarity index 100% rename from bench/device/simt_binary_or_binary_and_ssrgemm_nn_n_sm50.cu rename to bench/device/sm50_simt_binary_or_binary_and_ssrgemm_nn_n.cu diff --git a/bench/device/simt_binary_or_binary_and_ssrgemm_nn_t_sm50.cu b/bench/device/sm50_simt_binary_or_binary_and_ssrgemm_nn_t.cu similarity index 100% rename from bench/device/simt_binary_or_binary_and_ssrgemm_nn_t_sm50.cu rename to bench/device/sm50_simt_binary_or_binary_and_ssrgemm_nn_t.cu diff --git a/bench/device/simt_binary_or_binary_and_ssrgemm_nt_n_sm50.cu b/bench/device/sm50_simt_binary_or_binary_and_ssrgemm_nt_n.cu similarity index 100% rename from bench/device/simt_binary_or_binary_and_ssrgemm_nt_n_sm50.cu rename to bench/device/sm50_simt_binary_or_binary_and_ssrgemm_nt_n.cu diff --git a/bench/device/simt_binary_or_binary_and_ssrgemm_nt_t_sm50.cu b/bench/device/sm50_simt_binary_or_binary_and_ssrgemm_nt_t.cu similarity index 100% rename from bench/device/simt_binary_or_binary_and_ssrgemm_nt_t_sm50.cu rename to bench/device/sm50_simt_binary_or_binary_and_ssrgemm_nt_t.cu diff --git a/bench/device/simt_binary_or_binary_and_ssrgemm_tn_n_sm50.cu 
b/bench/device/sm50_simt_binary_or_binary_and_ssrgemm_tn_n.cu similarity index 100% rename from bench/device/simt_binary_or_binary_and_ssrgemm_tn_n_sm50.cu rename to bench/device/sm50_simt_binary_or_binary_and_ssrgemm_tn_n.cu diff --git a/bench/device/simt_binary_or_binary_and_ssrgemm_tn_t_sm50.cu b/bench/device/sm50_simt_binary_or_binary_and_ssrgemm_tn_t.cu similarity index 100% rename from bench/device/simt_binary_or_binary_and_ssrgemm_tn_t_sm50.cu rename to bench/device/sm50_simt_binary_or_binary_and_ssrgemm_tn_t.cu diff --git a/bench/device/simt_binary_or_binary_and_ssrgemm_tt_n_sm50.cu b/bench/device/sm50_simt_binary_or_binary_and_ssrgemm_tt_n.cu similarity index 100% rename from bench/device/simt_binary_or_binary_and_ssrgemm_tt_n_sm50.cu rename to bench/device/sm50_simt_binary_or_binary_and_ssrgemm_tt_n.cu diff --git a/bench/device/simt_binary_or_binary_and_ssrgemm_tt_t_sm50.cu b/bench/device/sm50_simt_binary_or_binary_and_ssrgemm_tt_t.cu similarity index 100% rename from bench/device/simt_binary_or_binary_and_ssrgemm_tt_t_sm50.cu rename to bench/device/sm50_simt_binary_or_binary_and_ssrgemm_tt_t.cu diff --git a/bench/device/simt_maximum_minimum_dsrgemm_nn_n_sm50.cu b/bench/device/sm50_simt_maximum_minimum_dsrgemm_nn_n.cu similarity index 100% rename from bench/device/simt_maximum_minimum_dsrgemm_nn_n_sm50.cu rename to bench/device/sm50_simt_maximum_minimum_dsrgemm_nn_n.cu diff --git a/bench/device/simt_maximum_minimum_dsrgemm_nn_t_sm50.cu b/bench/device/sm50_simt_maximum_minimum_dsrgemm_nn_t.cu similarity index 100% rename from bench/device/simt_maximum_minimum_dsrgemm_nn_t_sm50.cu rename to bench/device/sm50_simt_maximum_minimum_dsrgemm_nn_t.cu diff --git a/bench/device/simt_maximum_minimum_dsrgemm_nt_n_sm50.cu b/bench/device/sm50_simt_maximum_minimum_dsrgemm_nt_n.cu similarity index 100% rename from bench/device/simt_maximum_minimum_dsrgemm_nt_n_sm50.cu rename to bench/device/sm50_simt_maximum_minimum_dsrgemm_nt_n.cu diff --git 
a/bench/device/simt_maximum_minimum_dsrgemm_nt_t_sm50.cu b/bench/device/sm50_simt_maximum_minimum_dsrgemm_nt_t.cu similarity index 100% rename from bench/device/simt_maximum_minimum_dsrgemm_nt_t_sm50.cu rename to bench/device/sm50_simt_maximum_minimum_dsrgemm_nt_t.cu diff --git a/bench/device/simt_maximum_minimum_dsrgemm_tn_n_sm50.cu b/bench/device/sm50_simt_maximum_minimum_dsrgemm_tn_n.cu similarity index 100% rename from bench/device/simt_maximum_minimum_dsrgemm_tn_n_sm50.cu rename to bench/device/sm50_simt_maximum_minimum_dsrgemm_tn_n.cu diff --git a/bench/device/simt_maximum_minimum_dsrgemm_tn_t_sm50.cu b/bench/device/sm50_simt_maximum_minimum_dsrgemm_tn_t.cu similarity index 100% rename from bench/device/simt_maximum_minimum_dsrgemm_tn_t_sm50.cu rename to bench/device/sm50_simt_maximum_minimum_dsrgemm_tn_t.cu diff --git a/bench/device/simt_maximum_minimum_dsrgemm_tt_n_sm50.cu b/bench/device/sm50_simt_maximum_minimum_dsrgemm_tt_n.cu similarity index 100% rename from bench/device/simt_maximum_minimum_dsrgemm_tt_n_sm50.cu rename to bench/device/sm50_simt_maximum_minimum_dsrgemm_tt_n.cu diff --git a/bench/device/simt_maximum_minimum_dsrgemm_tt_t_sm50.cu b/bench/device/sm50_simt_maximum_minimum_dsrgemm_tt_t.cu similarity index 100% rename from bench/device/simt_maximum_minimum_dsrgemm_tt_t_sm50.cu rename to bench/device/sm50_simt_maximum_minimum_dsrgemm_tt_t.cu diff --git a/bench/device/simt_maximum_minimum_ssrgemm_nn_n_sm50.cu b/bench/device/sm50_simt_maximum_minimum_ssrgemm_nn_n.cu similarity index 100% rename from bench/device/simt_maximum_minimum_ssrgemm_nn_n_sm50.cu rename to bench/device/sm50_simt_maximum_minimum_ssrgemm_nn_n.cu diff --git a/bench/device/simt_maximum_minimum_ssrgemm_nn_t_sm50.cu b/bench/device/sm50_simt_maximum_minimum_ssrgemm_nn_t.cu similarity index 100% rename from bench/device/simt_maximum_minimum_ssrgemm_nn_t_sm50.cu rename to bench/device/sm50_simt_maximum_minimum_ssrgemm_nn_t.cu diff --git 
a/bench/device/simt_maximum_minimum_ssrgemm_nt_n_sm50.cu b/bench/device/sm50_simt_maximum_minimum_ssrgemm_nt_n.cu similarity index 100% rename from bench/device/simt_maximum_minimum_ssrgemm_nt_n_sm50.cu rename to bench/device/sm50_simt_maximum_minimum_ssrgemm_nt_n.cu diff --git a/bench/device/simt_maximum_minimum_ssrgemm_nt_t_sm50.cu b/bench/device/sm50_simt_maximum_minimum_ssrgemm_nt_t.cu similarity index 100% rename from bench/device/simt_maximum_minimum_ssrgemm_nt_t_sm50.cu rename to bench/device/sm50_simt_maximum_minimum_ssrgemm_nt_t.cu diff --git a/bench/device/simt_maximum_minimum_ssrgemm_tn_n_sm50.cu b/bench/device/sm50_simt_maximum_minimum_ssrgemm_tn_n.cu similarity index 100% rename from bench/device/simt_maximum_minimum_ssrgemm_tn_n_sm50.cu rename to bench/device/sm50_simt_maximum_minimum_ssrgemm_tn_n.cu diff --git a/bench/device/simt_maximum_minimum_ssrgemm_tn_t_sm50.cu b/bench/device/sm50_simt_maximum_minimum_ssrgemm_tn_t.cu similarity index 100% rename from bench/device/simt_maximum_minimum_ssrgemm_tn_t_sm50.cu rename to bench/device/sm50_simt_maximum_minimum_ssrgemm_tn_t.cu diff --git a/bench/device/simt_maximum_minimum_ssrgemm_tt_n_sm50.cu b/bench/device/sm50_simt_maximum_minimum_ssrgemm_tt_n.cu similarity index 100% rename from bench/device/simt_maximum_minimum_ssrgemm_tt_n_sm50.cu rename to bench/device/sm50_simt_maximum_minimum_ssrgemm_tt_n.cu diff --git a/bench/device/simt_maximum_minimum_ssrgemm_tt_t_sm50.cu b/bench/device/sm50_simt_maximum_minimum_ssrgemm_tt_t.cu similarity index 100% rename from bench/device/simt_maximum_minimum_ssrgemm_tt_t_sm50.cu rename to bench/device/sm50_simt_maximum_minimum_ssrgemm_tt_t.cu diff --git a/bench/device/simt_maximum_multiplies_dsrgemm_nn_n_sm50.cu b/bench/device/sm50_simt_maximum_multiplies_dsrgemm_nn_n.cu similarity index 100% rename from bench/device/simt_maximum_multiplies_dsrgemm_nn_n_sm50.cu rename to bench/device/sm50_simt_maximum_multiplies_dsrgemm_nn_n.cu diff --git 
a/bench/device/simt_maximum_multiplies_dsrgemm_nn_t_sm50.cu b/bench/device/sm50_simt_maximum_multiplies_dsrgemm_nn_t.cu similarity index 100% rename from bench/device/simt_maximum_multiplies_dsrgemm_nn_t_sm50.cu rename to bench/device/sm50_simt_maximum_multiplies_dsrgemm_nn_t.cu diff --git a/bench/device/simt_maximum_multiplies_dsrgemm_nt_n_sm50.cu b/bench/device/sm50_simt_maximum_multiplies_dsrgemm_nt_n.cu similarity index 100% rename from bench/device/simt_maximum_multiplies_dsrgemm_nt_n_sm50.cu rename to bench/device/sm50_simt_maximum_multiplies_dsrgemm_nt_n.cu diff --git a/bench/device/simt_maximum_multiplies_dsrgemm_nt_t_sm50.cu b/bench/device/sm50_simt_maximum_multiplies_dsrgemm_nt_t.cu similarity index 100% rename from bench/device/simt_maximum_multiplies_dsrgemm_nt_t_sm50.cu rename to bench/device/sm50_simt_maximum_multiplies_dsrgemm_nt_t.cu diff --git a/bench/device/simt_maximum_multiplies_dsrgemm_tn_n_sm50.cu b/bench/device/sm50_simt_maximum_multiplies_dsrgemm_tn_n.cu similarity index 100% rename from bench/device/simt_maximum_multiplies_dsrgemm_tn_n_sm50.cu rename to bench/device/sm50_simt_maximum_multiplies_dsrgemm_tn_n.cu diff --git a/bench/device/simt_maximum_multiplies_dsrgemm_tn_t_sm50.cu b/bench/device/sm50_simt_maximum_multiplies_dsrgemm_tn_t.cu similarity index 100% rename from bench/device/simt_maximum_multiplies_dsrgemm_tn_t_sm50.cu rename to bench/device/sm50_simt_maximum_multiplies_dsrgemm_tn_t.cu diff --git a/bench/device/simt_maximum_multiplies_dsrgemm_tt_n_sm50.cu b/bench/device/sm50_simt_maximum_multiplies_dsrgemm_tt_n.cu similarity index 100% rename from bench/device/simt_maximum_multiplies_dsrgemm_tt_n_sm50.cu rename to bench/device/sm50_simt_maximum_multiplies_dsrgemm_tt_n.cu diff --git a/bench/device/simt_maximum_multiplies_dsrgemm_tt_t_sm50.cu b/bench/device/sm50_simt_maximum_multiplies_dsrgemm_tt_t.cu similarity index 100% rename from bench/device/simt_maximum_multiplies_dsrgemm_tt_t_sm50.cu rename to 
bench/device/sm50_simt_maximum_multiplies_dsrgemm_tt_t.cu diff --git a/bench/device/simt_maximum_multiplies_ssrgemm_nn_n_sm50.cu b/bench/device/sm50_simt_maximum_multiplies_ssrgemm_nn_n.cu similarity index 100% rename from bench/device/simt_maximum_multiplies_ssrgemm_nn_n_sm50.cu rename to bench/device/sm50_simt_maximum_multiplies_ssrgemm_nn_n.cu diff --git a/bench/device/simt_maximum_multiplies_ssrgemm_nn_t_sm50.cu b/bench/device/sm50_simt_maximum_multiplies_ssrgemm_nn_t.cu similarity index 100% rename from bench/device/simt_maximum_multiplies_ssrgemm_nn_t_sm50.cu rename to bench/device/sm50_simt_maximum_multiplies_ssrgemm_nn_t.cu diff --git a/bench/device/simt_maximum_multiplies_ssrgemm_nt_n_sm50.cu b/bench/device/sm50_simt_maximum_multiplies_ssrgemm_nt_n.cu similarity index 100% rename from bench/device/simt_maximum_multiplies_ssrgemm_nt_n_sm50.cu rename to bench/device/sm50_simt_maximum_multiplies_ssrgemm_nt_n.cu diff --git a/bench/device/simt_maximum_multiplies_ssrgemm_nt_t_sm50.cu b/bench/device/sm50_simt_maximum_multiplies_ssrgemm_nt_t.cu similarity index 100% rename from bench/device/simt_maximum_multiplies_ssrgemm_nt_t_sm50.cu rename to bench/device/sm50_simt_maximum_multiplies_ssrgemm_nt_t.cu diff --git a/bench/device/simt_maximum_multiplies_ssrgemm_tn_n_sm50.cu b/bench/device/sm50_simt_maximum_multiplies_ssrgemm_tn_n.cu similarity index 100% rename from bench/device/simt_maximum_multiplies_ssrgemm_tn_n_sm50.cu rename to bench/device/sm50_simt_maximum_multiplies_ssrgemm_tn_n.cu diff --git a/bench/device/simt_maximum_multiplies_ssrgemm_tn_t_sm50.cu b/bench/device/sm50_simt_maximum_multiplies_ssrgemm_tn_t.cu similarity index 100% rename from bench/device/simt_maximum_multiplies_ssrgemm_tn_t_sm50.cu rename to bench/device/sm50_simt_maximum_multiplies_ssrgemm_tn_t.cu diff --git a/bench/device/simt_maximum_multiplies_ssrgemm_tt_n_sm50.cu b/bench/device/sm50_simt_maximum_multiplies_ssrgemm_tt_n.cu similarity index 100% rename from 
bench/device/simt_maximum_multiplies_ssrgemm_tt_n_sm50.cu rename to bench/device/sm50_simt_maximum_multiplies_ssrgemm_tt_n.cu diff --git a/bench/device/simt_maximum_multiplies_ssrgemm_tt_t_sm50.cu b/bench/device/sm50_simt_maximum_multiplies_ssrgemm_tt_t.cu similarity index 100% rename from bench/device/simt_maximum_multiplies_ssrgemm_tt_t_sm50.cu rename to bench/device/sm50_simt_maximum_multiplies_ssrgemm_tt_t.cu diff --git a/bench/device/simt_maximum_plus_dsrgemm_nn_n_sm50.cu b/bench/device/sm50_simt_maximum_plus_dsrgemm_nn_n.cu similarity index 100% rename from bench/device/simt_maximum_plus_dsrgemm_nn_n_sm50.cu rename to bench/device/sm50_simt_maximum_plus_dsrgemm_nn_n.cu diff --git a/bench/device/simt_maximum_plus_dsrgemm_nn_t_sm50.cu b/bench/device/sm50_simt_maximum_plus_dsrgemm_nn_t.cu similarity index 100% rename from bench/device/simt_maximum_plus_dsrgemm_nn_t_sm50.cu rename to bench/device/sm50_simt_maximum_plus_dsrgemm_nn_t.cu diff --git a/bench/device/simt_maximum_plus_dsrgemm_nt_n_sm50.cu b/bench/device/sm50_simt_maximum_plus_dsrgemm_nt_n.cu similarity index 100% rename from bench/device/simt_maximum_plus_dsrgemm_nt_n_sm50.cu rename to bench/device/sm50_simt_maximum_plus_dsrgemm_nt_n.cu diff --git a/bench/device/simt_maximum_plus_dsrgemm_nt_t_sm50.cu b/bench/device/sm50_simt_maximum_plus_dsrgemm_nt_t.cu similarity index 100% rename from bench/device/simt_maximum_plus_dsrgemm_nt_t_sm50.cu rename to bench/device/sm50_simt_maximum_plus_dsrgemm_nt_t.cu diff --git a/bench/device/simt_maximum_plus_dsrgemm_tn_n_sm50.cu b/bench/device/sm50_simt_maximum_plus_dsrgemm_tn_n.cu similarity index 100% rename from bench/device/simt_maximum_plus_dsrgemm_tn_n_sm50.cu rename to bench/device/sm50_simt_maximum_plus_dsrgemm_tn_n.cu diff --git a/bench/device/simt_maximum_plus_dsrgemm_tn_t_sm50.cu b/bench/device/sm50_simt_maximum_plus_dsrgemm_tn_t.cu similarity index 100% rename from bench/device/simt_maximum_plus_dsrgemm_tn_t_sm50.cu rename to 
bench/device/sm50_simt_maximum_plus_dsrgemm_tn_t.cu diff --git a/bench/device/simt_maximum_plus_dsrgemm_tt_n_sm50.cu b/bench/device/sm50_simt_maximum_plus_dsrgemm_tt_n.cu similarity index 100% rename from bench/device/simt_maximum_plus_dsrgemm_tt_n_sm50.cu rename to bench/device/sm50_simt_maximum_plus_dsrgemm_tt_n.cu diff --git a/bench/device/simt_maximum_plus_dsrgemm_tt_t_sm50.cu b/bench/device/sm50_simt_maximum_plus_dsrgemm_tt_t.cu similarity index 100% rename from bench/device/simt_maximum_plus_dsrgemm_tt_t_sm50.cu rename to bench/device/sm50_simt_maximum_plus_dsrgemm_tt_t.cu diff --git a/bench/device/simt_maximum_plus_ssrgemm_nn_n_sm50.cu b/bench/device/sm50_simt_maximum_plus_ssrgemm_nn_n.cu similarity index 100% rename from bench/device/simt_maximum_plus_ssrgemm_nn_n_sm50.cu rename to bench/device/sm50_simt_maximum_plus_ssrgemm_nn_n.cu diff --git a/bench/device/simt_maximum_plus_ssrgemm_nn_t_sm50.cu b/bench/device/sm50_simt_maximum_plus_ssrgemm_nn_t.cu similarity index 100% rename from bench/device/simt_maximum_plus_ssrgemm_nn_t_sm50.cu rename to bench/device/sm50_simt_maximum_plus_ssrgemm_nn_t.cu diff --git a/bench/device/simt_maximum_plus_ssrgemm_nt_n_sm50.cu b/bench/device/sm50_simt_maximum_plus_ssrgemm_nt_n.cu similarity index 100% rename from bench/device/simt_maximum_plus_ssrgemm_nt_n_sm50.cu rename to bench/device/sm50_simt_maximum_plus_ssrgemm_nt_n.cu diff --git a/bench/device/simt_maximum_plus_ssrgemm_nt_t_sm50.cu b/bench/device/sm50_simt_maximum_plus_ssrgemm_nt_t.cu similarity index 100% rename from bench/device/simt_maximum_plus_ssrgemm_nt_t_sm50.cu rename to bench/device/sm50_simt_maximum_plus_ssrgemm_nt_t.cu diff --git a/bench/device/simt_maximum_plus_ssrgemm_tn_n_sm50.cu b/bench/device/sm50_simt_maximum_plus_ssrgemm_tn_n.cu similarity index 100% rename from bench/device/simt_maximum_plus_ssrgemm_tn_n_sm50.cu rename to bench/device/sm50_simt_maximum_plus_ssrgemm_tn_n.cu diff --git a/bench/device/simt_maximum_plus_ssrgemm_tn_t_sm50.cu 
b/bench/device/sm50_simt_maximum_plus_ssrgemm_tn_t.cu similarity index 100% rename from bench/device/simt_maximum_plus_ssrgemm_tn_t_sm50.cu rename to bench/device/sm50_simt_maximum_plus_ssrgemm_tn_t.cu diff --git a/bench/device/simt_maximum_plus_ssrgemm_tt_n_sm50.cu b/bench/device/sm50_simt_maximum_plus_ssrgemm_tt_n.cu similarity index 100% rename from bench/device/simt_maximum_plus_ssrgemm_tt_n_sm50.cu rename to bench/device/sm50_simt_maximum_plus_ssrgemm_tt_n.cu diff --git a/bench/device/simt_maximum_plus_ssrgemm_tt_t_sm50.cu b/bench/device/sm50_simt_maximum_plus_ssrgemm_tt_t.cu similarity index 100% rename from bench/device/simt_maximum_plus_ssrgemm_tt_t_sm50.cu rename to bench/device/sm50_simt_maximum_plus_ssrgemm_tt_t.cu diff --git a/bench/device/simt_minimum_maximum_dsrgemm_nn_n_sm50.cu b/bench/device/sm50_simt_minimum_maximum_dsrgemm_nn_n.cu similarity index 100% rename from bench/device/simt_minimum_maximum_dsrgemm_nn_n_sm50.cu rename to bench/device/sm50_simt_minimum_maximum_dsrgemm_nn_n.cu diff --git a/bench/device/simt_minimum_maximum_dsrgemm_nn_t_sm50.cu b/bench/device/sm50_simt_minimum_maximum_dsrgemm_nn_t.cu similarity index 100% rename from bench/device/simt_minimum_maximum_dsrgemm_nn_t_sm50.cu rename to bench/device/sm50_simt_minimum_maximum_dsrgemm_nn_t.cu diff --git a/bench/device/simt_minimum_maximum_dsrgemm_nt_n_sm50.cu b/bench/device/sm50_simt_minimum_maximum_dsrgemm_nt_n.cu similarity index 100% rename from bench/device/simt_minimum_maximum_dsrgemm_nt_n_sm50.cu rename to bench/device/sm50_simt_minimum_maximum_dsrgemm_nt_n.cu diff --git a/bench/device/simt_minimum_maximum_dsrgemm_nt_t_sm50.cu b/bench/device/sm50_simt_minimum_maximum_dsrgemm_nt_t.cu similarity index 100% rename from bench/device/simt_minimum_maximum_dsrgemm_nt_t_sm50.cu rename to bench/device/sm50_simt_minimum_maximum_dsrgemm_nt_t.cu diff --git a/bench/device/simt_minimum_maximum_dsrgemm_tn_n_sm50.cu b/bench/device/sm50_simt_minimum_maximum_dsrgemm_tn_n.cu similarity index 100% 
rename from bench/device/simt_minimum_maximum_dsrgemm_tn_n_sm50.cu rename to bench/device/sm50_simt_minimum_maximum_dsrgemm_tn_n.cu diff --git a/bench/device/simt_minimum_maximum_dsrgemm_tn_t_sm50.cu b/bench/device/sm50_simt_minimum_maximum_dsrgemm_tn_t.cu similarity index 100% rename from bench/device/simt_minimum_maximum_dsrgemm_tn_t_sm50.cu rename to bench/device/sm50_simt_minimum_maximum_dsrgemm_tn_t.cu diff --git a/bench/device/simt_minimum_maximum_dsrgemm_tt_n_sm50.cu b/bench/device/sm50_simt_minimum_maximum_dsrgemm_tt_n.cu similarity index 100% rename from bench/device/simt_minimum_maximum_dsrgemm_tt_n_sm50.cu rename to bench/device/sm50_simt_minimum_maximum_dsrgemm_tt_n.cu diff --git a/bench/device/simt_minimum_maximum_dsrgemm_tt_t_sm50.cu b/bench/device/sm50_simt_minimum_maximum_dsrgemm_tt_t.cu similarity index 100% rename from bench/device/simt_minimum_maximum_dsrgemm_tt_t_sm50.cu rename to bench/device/sm50_simt_minimum_maximum_dsrgemm_tt_t.cu diff --git a/bench/device/simt_minimum_maximum_ssrgemm_nn_n_sm50.cu b/bench/device/sm50_simt_minimum_maximum_ssrgemm_nn_n.cu similarity index 100% rename from bench/device/simt_minimum_maximum_ssrgemm_nn_n_sm50.cu rename to bench/device/sm50_simt_minimum_maximum_ssrgemm_nn_n.cu diff --git a/bench/device/simt_minimum_maximum_ssrgemm_nn_t_sm50.cu b/bench/device/sm50_simt_minimum_maximum_ssrgemm_nn_t.cu similarity index 100% rename from bench/device/simt_minimum_maximum_ssrgemm_nn_t_sm50.cu rename to bench/device/sm50_simt_minimum_maximum_ssrgemm_nn_t.cu diff --git a/bench/device/simt_minimum_maximum_ssrgemm_nt_n_sm50.cu b/bench/device/sm50_simt_minimum_maximum_ssrgemm_nt_n.cu similarity index 100% rename from bench/device/simt_minimum_maximum_ssrgemm_nt_n_sm50.cu rename to bench/device/sm50_simt_minimum_maximum_ssrgemm_nt_n.cu diff --git a/bench/device/simt_minimum_maximum_ssrgemm_nt_t_sm50.cu b/bench/device/sm50_simt_minimum_maximum_ssrgemm_nt_t.cu similarity index 100% rename from 
bench/device/simt_minimum_maximum_ssrgemm_nt_t_sm50.cu rename to bench/device/sm50_simt_minimum_maximum_ssrgemm_nt_t.cu diff --git a/bench/device/simt_minimum_maximum_ssrgemm_tn_n_sm50.cu b/bench/device/sm50_simt_minimum_maximum_ssrgemm_tn_n.cu similarity index 100% rename from bench/device/simt_minimum_maximum_ssrgemm_tn_n_sm50.cu rename to bench/device/sm50_simt_minimum_maximum_ssrgemm_tn_n.cu diff --git a/bench/device/simt_minimum_maximum_ssrgemm_tn_t_sm50.cu b/bench/device/sm50_simt_minimum_maximum_ssrgemm_tn_t.cu similarity index 100% rename from bench/device/simt_minimum_maximum_ssrgemm_tn_t_sm50.cu rename to bench/device/sm50_simt_minimum_maximum_ssrgemm_tn_t.cu diff --git a/bench/device/simt_minimum_maximum_ssrgemm_tt_n_sm50.cu b/bench/device/sm50_simt_minimum_maximum_ssrgemm_tt_n.cu similarity index 100% rename from bench/device/simt_minimum_maximum_ssrgemm_tt_n_sm50.cu rename to bench/device/sm50_simt_minimum_maximum_ssrgemm_tt_n.cu diff --git a/bench/device/simt_minimum_maximum_ssrgemm_tt_t_sm50.cu b/bench/device/sm50_simt_minimum_maximum_ssrgemm_tt_t.cu similarity index 100% rename from bench/device/simt_minimum_maximum_ssrgemm_tt_t_sm50.cu rename to bench/device/sm50_simt_minimum_maximum_ssrgemm_tt_t.cu diff --git a/bench/device/simt_minimum_multiplies_dsrgemm_nn_n_sm50.cu b/bench/device/sm50_simt_minimum_multiplies_dsrgemm_nn_n.cu similarity index 100% rename from bench/device/simt_minimum_multiplies_dsrgemm_nn_n_sm50.cu rename to bench/device/sm50_simt_minimum_multiplies_dsrgemm_nn_n.cu diff --git a/bench/device/simt_minimum_multiplies_dsrgemm_nn_t_sm50.cu b/bench/device/sm50_simt_minimum_multiplies_dsrgemm_nn_t.cu similarity index 100% rename from bench/device/simt_minimum_multiplies_dsrgemm_nn_t_sm50.cu rename to bench/device/sm50_simt_minimum_multiplies_dsrgemm_nn_t.cu diff --git a/bench/device/simt_minimum_multiplies_dsrgemm_nt_n_sm50.cu b/bench/device/sm50_simt_minimum_multiplies_dsrgemm_nt_n.cu similarity index 100% rename from 
bench/device/simt_minimum_multiplies_dsrgemm_nt_n_sm50.cu rename to bench/device/sm50_simt_minimum_multiplies_dsrgemm_nt_n.cu diff --git a/bench/device/simt_minimum_multiplies_dsrgemm_nt_t_sm50.cu b/bench/device/sm50_simt_minimum_multiplies_dsrgemm_nt_t.cu similarity index 100% rename from bench/device/simt_minimum_multiplies_dsrgemm_nt_t_sm50.cu rename to bench/device/sm50_simt_minimum_multiplies_dsrgemm_nt_t.cu diff --git a/bench/device/simt_minimum_multiplies_dsrgemm_tn_n_sm50.cu b/bench/device/sm50_simt_minimum_multiplies_dsrgemm_tn_n.cu similarity index 100% rename from bench/device/simt_minimum_multiplies_dsrgemm_tn_n_sm50.cu rename to bench/device/sm50_simt_minimum_multiplies_dsrgemm_tn_n.cu diff --git a/bench/device/simt_minimum_multiplies_dsrgemm_tn_t_sm50.cu b/bench/device/sm50_simt_minimum_multiplies_dsrgemm_tn_t.cu similarity index 100% rename from bench/device/simt_minimum_multiplies_dsrgemm_tn_t_sm50.cu rename to bench/device/sm50_simt_minimum_multiplies_dsrgemm_tn_t.cu diff --git a/bench/device/simt_minimum_multiplies_dsrgemm_tt_n_sm50.cu b/bench/device/sm50_simt_minimum_multiplies_dsrgemm_tt_n.cu similarity index 100% rename from bench/device/simt_minimum_multiplies_dsrgemm_tt_n_sm50.cu rename to bench/device/sm50_simt_minimum_multiplies_dsrgemm_tt_n.cu diff --git a/bench/device/simt_minimum_multiplies_dsrgemm_tt_t_sm50.cu b/bench/device/sm50_simt_minimum_multiplies_dsrgemm_tt_t.cu similarity index 100% rename from bench/device/simt_minimum_multiplies_dsrgemm_tt_t_sm50.cu rename to bench/device/sm50_simt_minimum_multiplies_dsrgemm_tt_t.cu diff --git a/bench/device/simt_minimum_multiplies_ssrgemm_nn_n_sm50.cu b/bench/device/sm50_simt_minimum_multiplies_ssrgemm_nn_n.cu similarity index 100% rename from bench/device/simt_minimum_multiplies_ssrgemm_nn_n_sm50.cu rename to bench/device/sm50_simt_minimum_multiplies_ssrgemm_nn_n.cu diff --git a/bench/device/simt_minimum_multiplies_ssrgemm_nn_t_sm50.cu 
b/bench/device/sm50_simt_minimum_multiplies_ssrgemm_nn_t.cu similarity index 100% rename from bench/device/simt_minimum_multiplies_ssrgemm_nn_t_sm50.cu rename to bench/device/sm50_simt_minimum_multiplies_ssrgemm_nn_t.cu diff --git a/bench/device/simt_minimum_multiplies_ssrgemm_nt_n_sm50.cu b/bench/device/sm50_simt_minimum_multiplies_ssrgemm_nt_n.cu similarity index 100% rename from bench/device/simt_minimum_multiplies_ssrgemm_nt_n_sm50.cu rename to bench/device/sm50_simt_minimum_multiplies_ssrgemm_nt_n.cu diff --git a/bench/device/simt_minimum_multiplies_ssrgemm_nt_t_sm50.cu b/bench/device/sm50_simt_minimum_multiplies_ssrgemm_nt_t.cu similarity index 100% rename from bench/device/simt_minimum_multiplies_ssrgemm_nt_t_sm50.cu rename to bench/device/sm50_simt_minimum_multiplies_ssrgemm_nt_t.cu diff --git a/bench/device/simt_minimum_multiplies_ssrgemm_tn_n_sm50.cu b/bench/device/sm50_simt_minimum_multiplies_ssrgemm_tn_n.cu similarity index 100% rename from bench/device/simt_minimum_multiplies_ssrgemm_tn_n_sm50.cu rename to bench/device/sm50_simt_minimum_multiplies_ssrgemm_tn_n.cu diff --git a/bench/device/simt_minimum_multiplies_ssrgemm_tn_t_sm50.cu b/bench/device/sm50_simt_minimum_multiplies_ssrgemm_tn_t.cu similarity index 100% rename from bench/device/simt_minimum_multiplies_ssrgemm_tn_t_sm50.cu rename to bench/device/sm50_simt_minimum_multiplies_ssrgemm_tn_t.cu diff --git a/bench/device/simt_minimum_multiplies_ssrgemm_tt_n_sm50.cu b/bench/device/sm50_simt_minimum_multiplies_ssrgemm_tt_n.cu similarity index 100% rename from bench/device/simt_minimum_multiplies_ssrgemm_tt_n_sm50.cu rename to bench/device/sm50_simt_minimum_multiplies_ssrgemm_tt_n.cu diff --git a/bench/device/simt_minimum_multiplies_ssrgemm_tt_t_sm50.cu b/bench/device/sm50_simt_minimum_multiplies_ssrgemm_tt_t.cu similarity index 100% rename from bench/device/simt_minimum_multiplies_ssrgemm_tt_t_sm50.cu rename to bench/device/sm50_simt_minimum_multiplies_ssrgemm_tt_t.cu diff --git 
a/bench/device/simt_minimum_plus_dsrgemm_nn_n_sm50.cu b/bench/device/sm50_simt_minimum_plus_dsrgemm_nn_n.cu similarity index 100% rename from bench/device/simt_minimum_plus_dsrgemm_nn_n_sm50.cu rename to bench/device/sm50_simt_minimum_plus_dsrgemm_nn_n.cu diff --git a/bench/device/simt_minimum_plus_dsrgemm_nn_t_sm50.cu b/bench/device/sm50_simt_minimum_plus_dsrgemm_nn_t.cu similarity index 100% rename from bench/device/simt_minimum_plus_dsrgemm_nn_t_sm50.cu rename to bench/device/sm50_simt_minimum_plus_dsrgemm_nn_t.cu diff --git a/bench/device/simt_minimum_plus_dsrgemm_nt_n_sm50.cu b/bench/device/sm50_simt_minimum_plus_dsrgemm_nt_n.cu similarity index 100% rename from bench/device/simt_minimum_plus_dsrgemm_nt_n_sm50.cu rename to bench/device/sm50_simt_minimum_plus_dsrgemm_nt_n.cu diff --git a/bench/device/simt_minimum_plus_dsrgemm_nt_t_sm50.cu b/bench/device/sm50_simt_minimum_plus_dsrgemm_nt_t.cu similarity index 100% rename from bench/device/simt_minimum_plus_dsrgemm_nt_t_sm50.cu rename to bench/device/sm50_simt_minimum_plus_dsrgemm_nt_t.cu diff --git a/bench/device/simt_minimum_plus_dsrgemm_tn_n_sm50.cu b/bench/device/sm50_simt_minimum_plus_dsrgemm_tn_n.cu similarity index 100% rename from bench/device/simt_minimum_plus_dsrgemm_tn_n_sm50.cu rename to bench/device/sm50_simt_minimum_plus_dsrgemm_tn_n.cu diff --git a/bench/device/simt_minimum_plus_dsrgemm_tn_t_sm50.cu b/bench/device/sm50_simt_minimum_plus_dsrgemm_tn_t.cu similarity index 100% rename from bench/device/simt_minimum_plus_dsrgemm_tn_t_sm50.cu rename to bench/device/sm50_simt_minimum_plus_dsrgemm_tn_t.cu diff --git a/bench/device/simt_minimum_plus_dsrgemm_tt_n_sm50.cu b/bench/device/sm50_simt_minimum_plus_dsrgemm_tt_n.cu similarity index 100% rename from bench/device/simt_minimum_plus_dsrgemm_tt_n_sm50.cu rename to bench/device/sm50_simt_minimum_plus_dsrgemm_tt_n.cu diff --git a/bench/device/simt_minimum_plus_dsrgemm_tt_t_sm50.cu b/bench/device/sm50_simt_minimum_plus_dsrgemm_tt_t.cu similarity index 100% 
rename from bench/device/simt_minimum_plus_dsrgemm_tt_t_sm50.cu rename to bench/device/sm50_simt_minimum_plus_dsrgemm_tt_t.cu diff --git a/bench/device/simt_minimum_plus_ssrgemm_nn_n_sm50.cu b/bench/device/sm50_simt_minimum_plus_ssrgemm_nn_n.cu similarity index 100% rename from bench/device/simt_minimum_plus_ssrgemm_nn_n_sm50.cu rename to bench/device/sm50_simt_minimum_plus_ssrgemm_nn_n.cu diff --git a/bench/device/simt_minimum_plus_ssrgemm_nn_t_sm50.cu b/bench/device/sm50_simt_minimum_plus_ssrgemm_nn_t.cu similarity index 100% rename from bench/device/simt_minimum_plus_ssrgemm_nn_t_sm50.cu rename to bench/device/sm50_simt_minimum_plus_ssrgemm_nn_t.cu diff --git a/bench/device/simt_minimum_plus_ssrgemm_nt_n_sm50.cu b/bench/device/sm50_simt_minimum_plus_ssrgemm_nt_n.cu similarity index 100% rename from bench/device/simt_minimum_plus_ssrgemm_nt_n_sm50.cu rename to bench/device/sm50_simt_minimum_plus_ssrgemm_nt_n.cu diff --git a/bench/device/simt_minimum_plus_ssrgemm_nt_t_sm50.cu b/bench/device/sm50_simt_minimum_plus_ssrgemm_nt_t.cu similarity index 100% rename from bench/device/simt_minimum_plus_ssrgemm_nt_t_sm50.cu rename to bench/device/sm50_simt_minimum_plus_ssrgemm_nt_t.cu diff --git a/bench/device/simt_minimum_plus_ssrgemm_tn_n_sm50.cu b/bench/device/sm50_simt_minimum_plus_ssrgemm_tn_n.cu similarity index 100% rename from bench/device/simt_minimum_plus_ssrgemm_tn_n_sm50.cu rename to bench/device/sm50_simt_minimum_plus_ssrgemm_tn_n.cu diff --git a/bench/device/simt_minimum_plus_ssrgemm_tn_t_sm50.cu b/bench/device/sm50_simt_minimum_plus_ssrgemm_tn_t.cu similarity index 100% rename from bench/device/simt_minimum_plus_ssrgemm_tn_t_sm50.cu rename to bench/device/sm50_simt_minimum_plus_ssrgemm_tn_t.cu diff --git a/bench/device/simt_minimum_plus_ssrgemm_tt_n_sm50.cu b/bench/device/sm50_simt_minimum_plus_ssrgemm_tt_n.cu similarity index 100% rename from bench/device/simt_minimum_plus_ssrgemm_tt_n_sm50.cu rename to bench/device/sm50_simt_minimum_plus_ssrgemm_tt_n.cu diff 
--git a/bench/device/simt_minimum_plus_ssrgemm_tt_t_sm50.cu b/bench/device/sm50_simt_minimum_plus_ssrgemm_tt_t.cu similarity index 100% rename from bench/device/simt_minimum_plus_ssrgemm_tt_t_sm50.cu rename to bench/device/sm50_simt_minimum_plus_ssrgemm_tt_t.cu diff --git a/bench/device/simt_plus_multiplies_dsrgemm_nn_n_sm50.cu b/bench/device/sm50_simt_plus_multiplies_dsrgemm_nn_n.cu similarity index 100% rename from bench/device/simt_plus_multiplies_dsrgemm_nn_n_sm50.cu rename to bench/device/sm50_simt_plus_multiplies_dsrgemm_nn_n.cu diff --git a/bench/device/simt_plus_multiplies_dsrgemm_nn_t_sm50.cu b/bench/device/sm50_simt_plus_multiplies_dsrgemm_nn_t.cu similarity index 100% rename from bench/device/simt_plus_multiplies_dsrgemm_nn_t_sm50.cu rename to bench/device/sm50_simt_plus_multiplies_dsrgemm_nn_t.cu diff --git a/bench/device/simt_plus_multiplies_dsrgemm_nt_n_sm50.cu b/bench/device/sm50_simt_plus_multiplies_dsrgemm_nt_n.cu similarity index 100% rename from bench/device/simt_plus_multiplies_dsrgemm_nt_n_sm50.cu rename to bench/device/sm50_simt_plus_multiplies_dsrgemm_nt_n.cu diff --git a/bench/device/simt_plus_multiplies_dsrgemm_nt_t_sm50.cu b/bench/device/sm50_simt_plus_multiplies_dsrgemm_nt_t.cu similarity index 100% rename from bench/device/simt_plus_multiplies_dsrgemm_nt_t_sm50.cu rename to bench/device/sm50_simt_plus_multiplies_dsrgemm_nt_t.cu diff --git a/bench/device/simt_plus_multiplies_dsrgemm_tn_n_sm50.cu b/bench/device/sm50_simt_plus_multiplies_dsrgemm_tn_n.cu similarity index 100% rename from bench/device/simt_plus_multiplies_dsrgemm_tn_n_sm50.cu rename to bench/device/sm50_simt_plus_multiplies_dsrgemm_tn_n.cu diff --git a/bench/device/simt_plus_multiplies_dsrgemm_tn_t_sm50.cu b/bench/device/sm50_simt_plus_multiplies_dsrgemm_tn_t.cu similarity index 100% rename from bench/device/simt_plus_multiplies_dsrgemm_tn_t_sm50.cu rename to bench/device/sm50_simt_plus_multiplies_dsrgemm_tn_t.cu diff --git 
a/bench/device/simt_plus_multiplies_dsrgemm_tt_n_sm50.cu b/bench/device/sm50_simt_plus_multiplies_dsrgemm_tt_n.cu similarity index 100% rename from bench/device/simt_plus_multiplies_dsrgemm_tt_n_sm50.cu rename to bench/device/sm50_simt_plus_multiplies_dsrgemm_tt_n.cu diff --git a/bench/device/simt_plus_multiplies_dsrgemm_tt_t_sm50.cu b/bench/device/sm50_simt_plus_multiplies_dsrgemm_tt_t.cu similarity index 100% rename from bench/device/simt_plus_multiplies_dsrgemm_tt_t_sm50.cu rename to bench/device/sm50_simt_plus_multiplies_dsrgemm_tt_t.cu diff --git a/bench/device/simt_plus_multiplies_ssrgemm_nn_n_sm50.cu b/bench/device/sm50_simt_plus_multiplies_ssrgemm_nn_n.cu similarity index 100% rename from bench/device/simt_plus_multiplies_ssrgemm_nn_n_sm50.cu rename to bench/device/sm50_simt_plus_multiplies_ssrgemm_nn_n.cu diff --git a/bench/device/simt_plus_multiplies_ssrgemm_nn_t_sm50.cu b/bench/device/sm50_simt_plus_multiplies_ssrgemm_nn_t.cu similarity index 100% rename from bench/device/simt_plus_multiplies_ssrgemm_nn_t_sm50.cu rename to bench/device/sm50_simt_plus_multiplies_ssrgemm_nn_t.cu diff --git a/bench/device/simt_plus_multiplies_ssrgemm_nt_n_sm50.cu b/bench/device/sm50_simt_plus_multiplies_ssrgemm_nt_n.cu similarity index 100% rename from bench/device/simt_plus_multiplies_ssrgemm_nt_n_sm50.cu rename to bench/device/sm50_simt_plus_multiplies_ssrgemm_nt_n.cu diff --git a/bench/device/simt_plus_multiplies_ssrgemm_nt_t_sm50.cu b/bench/device/sm50_simt_plus_multiplies_ssrgemm_nt_t.cu similarity index 100% rename from bench/device/simt_plus_multiplies_ssrgemm_nt_t_sm50.cu rename to bench/device/sm50_simt_plus_multiplies_ssrgemm_nt_t.cu diff --git a/bench/device/simt_plus_multiplies_ssrgemm_tn_n_sm50.cu b/bench/device/sm50_simt_plus_multiplies_ssrgemm_tn_n.cu similarity index 100% rename from bench/device/simt_plus_multiplies_ssrgemm_tn_n_sm50.cu rename to bench/device/sm50_simt_plus_multiplies_ssrgemm_tn_n.cu diff --git 
a/bench/device/simt_plus_multiplies_ssrgemm_tn_t_sm50.cu b/bench/device/sm50_simt_plus_multiplies_ssrgemm_tn_t.cu similarity index 100% rename from bench/device/simt_plus_multiplies_ssrgemm_tn_t_sm50.cu rename to bench/device/sm50_simt_plus_multiplies_ssrgemm_tn_t.cu diff --git a/bench/device/simt_plus_multiplies_ssrgemm_tt_n_sm50.cu b/bench/device/sm50_simt_plus_multiplies_ssrgemm_tt_n.cu similarity index 100% rename from bench/device/simt_plus_multiplies_ssrgemm_tt_n_sm50.cu rename to bench/device/sm50_simt_plus_multiplies_ssrgemm_tt_n.cu diff --git a/bench/device/simt_plus_multiplies_ssrgemm_tt_t_sm50.cu b/bench/device/sm50_simt_plus_multiplies_ssrgemm_tt_t.cu similarity index 100% rename from bench/device/simt_plus_multiplies_ssrgemm_tt_t_sm50.cu rename to bench/device/sm50_simt_plus_multiplies_ssrgemm_tt_t.cu From a40f7bc3dc5eebb2ce825626c4c0dff8cee7fd48 Mon Sep 17 00:00:00 2001 From: Void Date: Sun, 31 Oct 2021 14:52:12 -0400 Subject: [PATCH 07/15] add benchmark generator, generated code, cmake file for default configs --- bench/device/CMakeLists.txt | 29 +- bench/device/gen_default_bench.py | 174 ++ bench/device/sm50_defaults.cu | 4366 +++++++++++++++++++++++++++++ 3 files changed, 4564 insertions(+), 5 deletions(-) create mode 100644 bench/device/gen_default_bench.py create mode 100644 bench/device/sm50_defaults.cu diff --git a/bench/device/CMakeLists.txt b/bench/device/CMakeLists.txt index c1d1183..ef85505 100644 --- a/bench/device/CMakeLists.txt +++ b/bench/device/CMakeLists.txt @@ -1,16 +1,35 @@ -file(GLOB SIMT_BENCH_SRCS CONFIGURE_DEPENDS *.cu) -add_executable(cuasr_bench_srgemm_device +# Just the default configurations +add_executable(cuasr_bench_srgemm_device_defaults + sm50_defaults.cu +) +target_include_directories( + cuasr_bench_srgemm_device_defaults + PRIVATE + ${PROJECT_SOURCE_DIR}/include/ + ${PROJECT_SOURCE_DIR}/tools/include/ + ${PROJECT_SOURCE_DIR}/cutlass/include/ + ${PROJECT_SOURCE_DIR}/cutlass/tools/util/include/ +) 
+target_link_libraries(cuasr_bench_srgemm_device_defaults + benchmark + benchmark_main + ${cuASR_LIB_NAME} +) + +# All shmoo benchmarks +file(GLOB SIMT_BENCH_SRCS CONFIGURE_DEPENDS sm50_simt_*.cu) +add_executable(cuasr_bench_srgemm_device_shmoo ${SIMT_BENCH_SRCS} ) target_include_directories( - cuasr_bench_srgemm_device + cuasr_bench_srgemm_device_shmoo PRIVATE ${PROJECT_SOURCE_DIR}/include/ ${PROJECT_SOURCE_DIR}/tools/include/ ${PROJECT_SOURCE_DIR}/cutlass/include/ ${PROJECT_SOURCE_DIR}/cutlass/tools/util/include/ ) -target_link_libraries(cuasr_bench_srgemm_device +target_link_libraries(cuasr_bench_srgemm_device_shmoo benchmark benchmark_main ${cuASR_LIB_NAME} @@ -18,6 +37,6 @@ target_link_libraries(cuasr_bench_srgemm_device if(NOT DEFINED CUASR_BENCH_LEVEL) set(CUASR_BENCH_LEVEL 0) endif() -target_compile_definitions(cuasr_bench_srgemm_device +target_compile_definitions(cuasr_bench_srgemm_device_shmoo PRIVATE CUASR_BENCH_LEVEL=${CUASR_BENCH_LEVEL} ) diff --git a/bench/device/gen_default_bench.py b/bench/device/gen_default_bench.py new file mode 100644 index 0000000..9465f87 --- /dev/null +++ b/bench/device/gen_default_bench.py @@ -0,0 +1,174 @@ +import os +import sys +import argparse + +################################################################################ +# This file creates all the possible semiring-gemm kernels for all transposes +# using just the default SRGEMM configurations for them. 
+################################################################################
+
+precisions = [  # each row: [name prefix char, C++ element type]
+    ["d", "double"],
+    ["s", "float"],
+]
+
+transposes = [  # each row: [A, B, C] flags; True -> "n" (column-major), False -> "t" (row-major)
+    [False, False, True],
+    [False, False, False],
+    [False, True, True],
+    [False, True, False],
+    [True, False, True],
+    [True, False, False],
+    [True, True, True],
+    [True, True, False],
+]
+
+semiring_operators = [  # each row: [addition op, multiplication op], substituted as cuasr::<op><precision>
+    ["plus", "multiplies"],  # regular GEMM
+    ["minimum", "plus"],  # min-plus (tropical)
+    ["maximum", "plus"],  # max-plus
+    ["minimum", "maximum"],  # min-max
+    ["maximum", "minimum"],  # max-min
+    ["minimum", "multiplies"],  # min-multiplies
+    ["maximum", "multiplies"],  # max-multiplies
+    ["binary_or", "binary_and"]  # or-and
+]
+
+benchfile_header = """\
+/***************************************************************************************************
+* Copyright (c) 2021, Vijay Thakkar (thakkarv@gatech.edu).
+**************************************************************************************************/
+//////////////////////////////////////////////////////////////////////
+// THIS BENCHMARK FILE IS GENERATED AUTOMATICALLY : DO NOT MODIFY //
+//////////////////////////////////////////////////////////////////////
+
+#include "benchmark/benchmark.h"
+
+#include "cuasr/gemm/device/default_srgemm_configuration.h"
+#include "cuasr/gemm/device/srgemm.h"
+#include "cuasr/functional.h"
+
+#include "harness.h"
+"""
+
+bench_template = """\
+
+///////////////////////////////////////////////////////////////////////////////
+
+static void BM_SM{sm_arch}_device_{add_op}_{mult_op}_{precision_char}srgemm_{transA}{transB}_{transC}(benchmark::State &state) {{
+  const auto N = static_cast<int>(state.range(0)); // state.range() returns int64_t
+  using precision = {precision_type};
+  using OpClass = cutlass::arch::OpClassSimt;
+  using SmArch = cutlass::arch::Sm{sm_arch};
+
+  using AddOp = cuasr::{add_op}<precision>;
+  using MultOp = cuasr::{mult_op}<precision>;
+
+  using Srgemm = cuasr::gemm::device::Srgemm< //
+      AddOp, MultOp, //
+      precision, cutlass::layout::{trans_typeA}Major, //
+      precision, cutlass::layout::{trans_typeB}Major, //
+      precision, cutlass::layout::{trans_typeC}Major, //
+      precision, OpClass, SmArch>;
+
+  // setup bench harness
+  cuasr::bench::device::BenchHarness<Srgemm> bench({{ N, N, N }});
+
+  // benchmark loop
+  for (auto _ : state) {{
+    benchmark::DoNotOptimize(bench.run());
+    cudaDeviceSynchronize();
+  }}
+
+  double flops_per_itr = 2.0 * N * N * N;
+  state.counters["Flop/s"]
+      = benchmark::Counter(flops_per_itr, benchmark::Counter::kIsIterationInvariantRate);
+}}
+BENCHMARK(BM_SM{sm_arch}_device_{add_op}_{mult_op}_{precision_char}srgemm_{transA}{transB}_{transC})
+    ->RangeMultiplier(2)->Range(256, 4096);
+"""
+
+
+def write_benchmark_file_header(benchfile):  # writes the banner and #include block (benchfile_header) to benchfile
+    benchfile.write(benchfile_header)
+
+
+def write_benchmark_to_file(  # formats bench_template once and appends it; transX is "n" (Column) or anything else (Row)
+        benchfile,
+        sm_arch,
+        add_op,
+        mult_op,
+        precision_char,
+        precision_type,
+        transA,
+        transB,
+        transC):
+    trans_typeA = "Column" if transA == "n" else "Row"
+    trans_typeB = "Column" if transB == "n" else "Row"
+    trans_typeC = "Column" if transC == "n" else "Row"
+    benchfile.write(bench_template.format(
+        sm_arch=sm_arch,
+        add_op=add_op,
+        mult_op=mult_op,
+        precision_char=precision_char,
+        precision_type=precision_type,
+        transA=transA,
+        transB=transB,
+        transC=transC,
+        trans_typeA=trans_typeA,
+        trans_typeB=trans_typeB,
+        trans_typeC=trans_typeC
+    ))
+
+
+def main(args):  # writes sm<arch>_defaults.cu into args.output_dir: one benchmark per semiring x precision x layout row
+    num_benches = 0
+    benchfile_name = "sm{}_defaults.cu".format(args.sm_arch)
+    print(benchfile_name)
+    filePath = os.path.join(args.output_dir, benchfile_name)
+
+    # open file and gen all default tests
+    with open(filePath, "w") as benchfile:
+        write_benchmark_file_header(benchfile)
+
+        # for all semirings
+        for add_op, mult_op in semiring_operators:
+            # for all precisions
+            for precision in precisions:
+                precision_char = precision[0]
+                precision_type = precision[1]
+
+                # transposes
+                for transpose in transposes:
+                    # get transpose char
+                    column_major_A = transpose[0]
+                    column_major_B = transpose[1]
+                    column_major_C = transpose[2]
+                    transA = "n" if column_major_A else "t"
+                    transB = "n" if column_major_B else "t"
+                    transC = "n" if column_major_C else "t"
+
+                    # write to file
+                    write_benchmark_to_file(
+                        benchfile,
+                        args.sm_arch,
+                        add_op,
+                        mult_op,
+                        precision_char,
+                        precision_type,
+                        transA,
+                        transB,
+                        transC)
+                    num_benches += 1
+    print("Total bench count per semi-ring = {}".format(
+        num_benches // len(semiring_operators)))
+
+
+if __name__ == "__main__":
+    parser = argparse.ArgumentParser()
+    parser.add_argument("-o", "--output-dir", type=str, required=False, default=".",
+                        help="Path to the output dir.")
+    parser.add_argument("-sm", "--sm-arch", type=int, required=False, default=50, choices=[50, 80],
+                        help="SM architecture version number,")
+    args = parser.parse_args(sys.argv[1:])
+    main(args)
diff --git a/bench/device/sm50_defaults.cu b/bench/device/sm50_defaults.cu
new file mode 100644
index 0000000..eddb201
--- /dev/null
+++ b/bench/device/sm50_defaults.cu
@@ -0,0 +1,4366 @@
+/***************************************************************************************************
+* Copyright (c) 2021, Vijay Thakkar (thakkarv@gatech.edu).
+**************************************************************************************************/
+//////////////////////////////////////////////////////////////////////
+// THIS BENCHMARK FILE IS GENERATED AUTOMATICALLY : DO NOT MODIFY //
+//////////////////////////////////////////////////////////////////////
+
+#include "benchmark/benchmark.h"
+
+#include "cuasr/gemm/device/default_srgemm_configuration.h"
+#include "cuasr/gemm/device/srgemm.h"
+#include "cuasr/functional.h"
+
+#include "harness.h"
+
+///////////////////////////////////////////////////////////////////////////////
+
+static void BM_SM50_device_plus_multiplies_dsrgemm_tt_n(benchmark::State &state) {
+  const auto N = static_cast<int>(state.range(0)); // state.range() returns int64_t
+  using precision = double;
+  using OpClass = cutlass::arch::OpClassSimt;
+  using SmArch = cutlass::arch::Sm50;
+
+  using AddOp = cuasr::plus<precision>;
+  using MultOp = cuasr::multiplies<precision>;
+
+  using Srgemm = cuasr::gemm::device::Srgemm< //
+      AddOp, MultOp, //
+      precision, cutlass::layout::RowMajor, //
+      precision, cutlass::layout::RowMajor, //
+      precision, cutlass::layout::ColumnMajor, //
+      precision, OpClass, SmArch>;
+
+  // setup bench harness
+  cuasr::bench::device::BenchHarness<Srgemm> bench({ N, N, N });
+
+  // benchmark loop
+  for (auto _ : state) {
+    benchmark::DoNotOptimize(bench.run());
+    cudaDeviceSynchronize();
+  }
+
+  double flops_per_itr = 2.0 * N * N * N;
+  state.counters["Flop/s"]
+      = benchmark::Counter(flops_per_itr, benchmark::Counter::kIsIterationInvariantRate);
+}
+BENCHMARK(BM_SM50_device_plus_multiplies_dsrgemm_tt_n)
+    ->RangeMultiplier(2)->Range(256, 4096);
+
+///////////////////////////////////////////////////////////////////////////////
+
+static void BM_SM50_device_plus_multiplies_dsrgemm_tt_t(benchmark::State &state) {
+  const auto N = static_cast<int>(state.range(0)); // state.range() returns int64_t
+  using precision = double;
+  using OpClass = cutlass::arch::OpClassSimt;
+  using SmArch = cutlass::arch::Sm50;
+
+  using AddOp = cuasr::plus<precision>;
+  using MultOp = cuasr::multiplies<precision>;
+
+  using Srgemm = cuasr::gemm::device::Srgemm< //
+      AddOp, MultOp, //
+      precision, cutlass::layout::RowMajor, //
+      precision, cutlass::layout::RowMajor, //
+      precision, cutlass::layout::RowMajor, //
+      precision, OpClass, SmArch>;
+
+  // setup bench harness
+  cuasr::bench::device::BenchHarness<Srgemm> bench({ N, N, N });
+
+  // benchmark loop
+  for (auto _ : state) {
+    benchmark::DoNotOptimize(bench.run());
+    cudaDeviceSynchronize();
+  }
+
+  double flops_per_itr = 2.0 * N * N * N;
+  state.counters["Flop/s"]
+      = benchmark::Counter(flops_per_itr, benchmark::Counter::kIsIterationInvariantRate);
+}
+BENCHMARK(BM_SM50_device_plus_multiplies_dsrgemm_tt_t)
+    ->RangeMultiplier(2)->Range(256, 4096);
+
+///////////////////////////////////////////////////////////////////////////////
+
+static void BM_SM50_device_plus_multiplies_dsrgemm_tn_n(benchmark::State &state) {
+  const auto N = static_cast<int>(state.range(0)); // state.range() returns int64_t
+  using precision = double;
+  using OpClass = cutlass::arch::OpClassSimt;
+  using SmArch = cutlass::arch::Sm50;
+
+  using AddOp = cuasr::plus<precision>;
+  using MultOp = cuasr::multiplies<precision>;
+
+  using Srgemm = cuasr::gemm::device::Srgemm< //
+      AddOp, MultOp, //
+      precision, cutlass::layout::RowMajor, //
+      precision, cutlass::layout::ColumnMajor, //
+      precision, cutlass::layout::ColumnMajor, //
+      precision, OpClass, SmArch>;
+
+  // setup bench harness
+  cuasr::bench::device::BenchHarness<Srgemm> bench({ N, N, N });
+
+  // benchmark loop
+  for (auto _ : state) {
+    benchmark::DoNotOptimize(bench.run());
+    cudaDeviceSynchronize();
+  }
+
+  double flops_per_itr = 2.0 * N * N * N;
+  state.counters["Flop/s"]
+      = benchmark::Counter(flops_per_itr, benchmark::Counter::kIsIterationInvariantRate);
+}
+BENCHMARK(BM_SM50_device_plus_multiplies_dsrgemm_tn_n)
+    ->RangeMultiplier(2)->Range(256, 4096);
+
+///////////////////////////////////////////////////////////////////////////////
+
+static void BM_SM50_device_plus_multiplies_dsrgemm_tn_t(benchmark::State &state) {
+  const auto N = static_cast<int>(state.range(0)); // state.range() returns int64_t
+  using precision = double;
+  using OpClass = cutlass::arch::OpClassSimt;
+  using SmArch = cutlass::arch::Sm50;
+
+  using AddOp = cuasr::plus<precision>;
+  using MultOp = cuasr::multiplies<precision>;
+
+  using Srgemm = cuasr::gemm::device::Srgemm< //
+      AddOp, MultOp, //
+      precision, cutlass::layout::RowMajor, //
+      precision, cutlass::layout::ColumnMajor, //
+      precision, cutlass::layout::RowMajor, //
+      precision, OpClass, SmArch>;
+
+  // setup bench harness
+  cuasr::bench::device::BenchHarness<Srgemm> bench({ N, N, N });
+
+  // benchmark loop
+  for (auto _ : state) {
+    benchmark::DoNotOptimize(bench.run());
+    cudaDeviceSynchronize();
+  }
+
+  double flops_per_itr = 2.0 * N * N * N;
+  state.counters["Flop/s"]
+      = benchmark::Counter(flops_per_itr, benchmark::Counter::kIsIterationInvariantRate);
+}
+BENCHMARK(BM_SM50_device_plus_multiplies_dsrgemm_tn_t)
+    ->RangeMultiplier(2)->Range(256, 4096);
+
+///////////////////////////////////////////////////////////////////////////////
+
+static void BM_SM50_device_plus_multiplies_dsrgemm_nt_n(benchmark::State &state) {
+  const auto N = static_cast<int>(state.range(0)); // state.range() returns int64_t
+  using precision = double;
+  using OpClass = cutlass::arch::OpClassSimt;
+  using SmArch = cutlass::arch::Sm50;
+
+  using AddOp = cuasr::plus<precision>;
+  using MultOp = cuasr::multiplies<precision>;
+
+  using Srgemm = cuasr::gemm::device::Srgemm< //
+      AddOp, MultOp, //
+      precision, cutlass::layout::ColumnMajor, //
+      precision, cutlass::layout::RowMajor, //
+      precision, cutlass::layout::ColumnMajor, //
+      precision, OpClass, SmArch>;
+
+  // setup bench harness
+  cuasr::bench::device::BenchHarness<Srgemm> bench({ N, N, N });
+
+  // benchmark loop
+  for (auto _ : state) {
+    benchmark::DoNotOptimize(bench.run());
+    cudaDeviceSynchronize();
+  }
+
+  double flops_per_itr = 2.0 * N * N * N;
+  state.counters["Flop/s"]
+      = benchmark::Counter(flops_per_itr, benchmark::Counter::kIsIterationInvariantRate);
+}
+BENCHMARK(BM_SM50_device_plus_multiplies_dsrgemm_nt_n)
+    ->RangeMultiplier(2)->Range(256, 4096);
+
+///////////////////////////////////////////////////////////////////////////////
+
+static void BM_SM50_device_plus_multiplies_dsrgemm_nt_t(benchmark::State &state) {
+  const auto N = static_cast<int>(state.range(0)); // state.range() returns int64_t
+  using precision = double;
+  using OpClass = cutlass::arch::OpClassSimt;
+  using SmArch = cutlass::arch::Sm50;
+
+  using AddOp = cuasr::plus<precision>;
+  using MultOp = cuasr::multiplies<precision>;
+
+  using Srgemm = cuasr::gemm::device::Srgemm< //
+      AddOp, MultOp, //
+      precision, cutlass::layout::ColumnMajor, //
+      precision, cutlass::layout::RowMajor, //
+      precision, cutlass::layout::RowMajor, //
+      precision, OpClass, SmArch>;
+
+  // setup bench harness
+  cuasr::bench::device::BenchHarness<Srgemm> bench({ N, N, N });
+
+  // benchmark loop
+  for (auto _ : state) {
+    benchmark::DoNotOptimize(bench.run());
+    cudaDeviceSynchronize();
+  }
+
+  double flops_per_itr = 2.0 * N * N * N;
+  state.counters["Flop/s"]
+      = benchmark::Counter(flops_per_itr, benchmark::Counter::kIsIterationInvariantRate);
+}
+BENCHMARK(BM_SM50_device_plus_multiplies_dsrgemm_nt_t)
+    ->RangeMultiplier(2)->Range(256, 4096);
+
+///////////////////////////////////////////////////////////////////////////////
+
+static void BM_SM50_device_plus_multiplies_dsrgemm_nn_n(benchmark::State &state) {
+  const auto N = static_cast<int>(state.range(0)); // state.range() returns int64_t
+  using precision = double;
+  using OpClass = cutlass::arch::OpClassSimt;
+  using SmArch = cutlass::arch::Sm50;
+
+  using AddOp = cuasr::plus<precision>;
+  using MultOp = cuasr::multiplies<precision>;
+
+  using Srgemm = cuasr::gemm::device::Srgemm< //
+      AddOp, MultOp, //
+      precision, cutlass::layout::ColumnMajor, //
+      precision, cutlass::layout::ColumnMajor, //
+      precision, cutlass::layout::ColumnMajor, //
+      precision, OpClass, SmArch>;
+
+  // setup bench harness
+  cuasr::bench::device::BenchHarness<Srgemm> bench({ N, N, N });
+
+  // benchmark loop
+  for (auto _ : state) {
+    benchmark::DoNotOptimize(bench.run());
+    cudaDeviceSynchronize();
+  }
+
+  double flops_per_itr = 2.0 * N * N * N;
+  state.counters["Flop/s"]
+      = benchmark::Counter(flops_per_itr, benchmark::Counter::kIsIterationInvariantRate);
+}
+BENCHMARK(BM_SM50_device_plus_multiplies_dsrgemm_nn_n)
+    ->RangeMultiplier(2)->Range(256, 4096);
+
+///////////////////////////////////////////////////////////////////////////////
+
+static void BM_SM50_device_plus_multiplies_dsrgemm_nn_t(benchmark::State &state) {
+  const auto N = static_cast<int>(state.range(0)); // state.range() returns int64_t
+  using precision = double;
+  using OpClass = cutlass::arch::OpClassSimt;
+  using SmArch = cutlass::arch::Sm50;
+
+  using AddOp = cuasr::plus<precision>;
+  using MultOp = cuasr::multiplies<precision>;
+
+  using Srgemm = cuasr::gemm::device::Srgemm< //
+      AddOp, MultOp, //
+      precision, cutlass::layout::ColumnMajor, //
+      precision, cutlass::layout::ColumnMajor, //
+      precision, cutlass::layout::RowMajor, //
+      precision, OpClass, SmArch>;
+
+  // setup bench harness
+  cuasr::bench::device::BenchHarness<Srgemm> bench({ N, N, N });
+
+  // benchmark loop
+  for (auto _ : state) {
+    benchmark::DoNotOptimize(bench.run());
+    cudaDeviceSynchronize();
+  }
+
+  double flops_per_itr = 2.0 * N * N * N;
+  state.counters["Flop/s"]
+      = benchmark::Counter(flops_per_itr, benchmark::Counter::kIsIterationInvariantRate);
+}
+BENCHMARK(BM_SM50_device_plus_multiplies_dsrgemm_nn_t)
+    ->RangeMultiplier(2)->Range(256, 4096);
+
+///////////////////////////////////////////////////////////////////////////////
+
+static void BM_SM50_device_plus_multiplies_ssrgemm_tt_n(benchmark::State &state) {
+  const auto N = static_cast<int>(state.range(0)); // state.range() returns int64_t
+  using precision = float;
+  using OpClass = cutlass::arch::OpClassSimt;
+  using SmArch = cutlass::arch::Sm50;
+
+  using AddOp = cuasr::plus<precision>;
+  using MultOp = cuasr::multiplies<precision>;
+
+  using Srgemm = cuasr::gemm::device::Srgemm< //
+      AddOp, MultOp, //
+      precision, cutlass::layout::RowMajor, //
+      precision, cutlass::layout::RowMajor, //
+      precision, cutlass::layout::ColumnMajor, //
+      precision, OpClass, SmArch>;
+
+  // setup bench harness
+  cuasr::bench::device::BenchHarness<Srgemm> bench({ N, N, N });
+
+  // benchmark loop
+  for (auto _ : state) {
+    benchmark::DoNotOptimize(bench.run());
+    cudaDeviceSynchronize();
+  }
+
+  double flops_per_itr = 2.0 * N * N * N;
+  state.counters["Flop/s"]
+      = benchmark::Counter(flops_per_itr, benchmark::Counter::kIsIterationInvariantRate);
+}
+BENCHMARK(BM_SM50_device_plus_multiplies_ssrgemm_tt_n)
+    ->RangeMultiplier(2)->Range(256, 4096);
+
+///////////////////////////////////////////////////////////////////////////////
+
+static void BM_SM50_device_plus_multiplies_ssrgemm_tt_t(benchmark::State &state) {
+  const auto N = static_cast<int>(state.range(0)); // state.range() returns int64_t
+  using precision = float;
+  using OpClass = cutlass::arch::OpClassSimt;
+  using SmArch = cutlass::arch::Sm50;
+
+  using AddOp = cuasr::plus<precision>;
+  using MultOp = cuasr::multiplies<precision>;
+
+  using Srgemm = cuasr::gemm::device::Srgemm< //
+      AddOp, MultOp, //
+      precision, cutlass::layout::RowMajor, //
+      precision, cutlass::layout::RowMajor, //
+      precision, cutlass::layout::RowMajor, //
+      precision, OpClass, SmArch>;
+
+  // setup bench harness
+  cuasr::bench::device::BenchHarness<Srgemm> bench({ N, N, N });
+
+  // benchmark loop
+  for (auto _ : state) {
+    benchmark::DoNotOptimize(bench.run());
+    cudaDeviceSynchronize();
+  }
+
+  double flops_per_itr = 2.0 * N * N * N;
+  state.counters["Flop/s"]
+      = benchmark::Counter(flops_per_itr, benchmark::Counter::kIsIterationInvariantRate);
+}
+BENCHMARK(BM_SM50_device_plus_multiplies_ssrgemm_tt_t)
+    ->RangeMultiplier(2)->Range(256, 4096);
+
+///////////////////////////////////////////////////////////////////////////////
+
+static void BM_SM50_device_plus_multiplies_ssrgemm_tn_n(benchmark::State &state) {
+  const auto N = static_cast<int>(state.range(0)); // state.range() returns int64_t
+  using precision = float;
+  using OpClass = cutlass::arch::OpClassSimt;
+  using SmArch = cutlass::arch::Sm50;
+
+  using AddOp = cuasr::plus<precision>;
+  using MultOp = cuasr::multiplies<precision>;
+
+  using Srgemm = cuasr::gemm::device::Srgemm< //
+      AddOp, MultOp, //
+      precision, cutlass::layout::RowMajor, //
+      precision, cutlass::layout::ColumnMajor, //
+      precision, cutlass::layout::ColumnMajor, //
+      precision, OpClass, SmArch>;
+
+  // setup bench harness
+  cuasr::bench::device::BenchHarness<Srgemm> bench({ N, N, N });
+
+  // benchmark loop
+  for (auto _ : state) {
+    benchmark::DoNotOptimize(bench.run());
+    cudaDeviceSynchronize();
+  }
+
+  double flops_per_itr = 2.0 * N * N * N;
+  state.counters["Flop/s"]
+      = benchmark::Counter(flops_per_itr, benchmark::Counter::kIsIterationInvariantRate);
+}
+BENCHMARK(BM_SM50_device_plus_multiplies_ssrgemm_tn_n)
+    ->RangeMultiplier(2)->Range(256, 4096);
+
+///////////////////////////////////////////////////////////////////////////////
+
+static void BM_SM50_device_plus_multiplies_ssrgemm_tn_t(benchmark::State &state) {
+  const auto N = static_cast<int>(state.range(0)); // state.range() returns int64_t
+  using precision = float;
+  using OpClass = cutlass::arch::OpClassSimt;
+  using SmArch = cutlass::arch::Sm50;
+
+  using AddOp = cuasr::plus<precision>;
+  using MultOp = cuasr::multiplies<precision>;
+
+  using Srgemm = cuasr::gemm::device::Srgemm< //
+      AddOp, MultOp, //
+      precision, cutlass::layout::RowMajor, //
+      precision, cutlass::layout::ColumnMajor, //
+      precision, cutlass::layout::RowMajor, //
+      precision, OpClass, SmArch>;
+
+  // setup bench harness
+  cuasr::bench::device::BenchHarness<Srgemm> bench({ N, N, N });
+
+  // benchmark loop
+  for (auto _ : state) {
+    benchmark::DoNotOptimize(bench.run());
+    cudaDeviceSynchronize();
+  }
+
+  double flops_per_itr = 2.0 * N * N * N;
+  state.counters["Flop/s"]
+      = benchmark::Counter(flops_per_itr, benchmark::Counter::kIsIterationInvariantRate);
+}
+BENCHMARK(BM_SM50_device_plus_multiplies_ssrgemm_tn_t)
+    ->RangeMultiplier(2)->Range(256, 4096);
+
+///////////////////////////////////////////////////////////////////////////////
+
+static void BM_SM50_device_plus_multiplies_ssrgemm_nt_n(benchmark::State &state) {
+  const auto N = static_cast<int>(state.range(0)); // state.range() returns int64_t
+  using precision = float;
+  using OpClass = cutlass::arch::OpClassSimt;
+  using SmArch = cutlass::arch::Sm50;
+
+  using AddOp = cuasr::plus<precision>;
+  using MultOp = cuasr::multiplies<precision>;
+
+  using Srgemm = cuasr::gemm::device::Srgemm< //
+      AddOp, MultOp, //
+      precision, cutlass::layout::ColumnMajor, //
+      precision, cutlass::layout::RowMajor, //
+      precision, cutlass::layout::ColumnMajor, //
+      precision, OpClass, SmArch>;
+
+  // setup bench harness
+  cuasr::bench::device::BenchHarness<Srgemm> bench({ N, N, N });
+
+  // benchmark loop
+  for (auto _ : state) {
+    benchmark::DoNotOptimize(bench.run());
+    cudaDeviceSynchronize();
+  }
+
+  double flops_per_itr = 2.0 * N * N * N;
+  state.counters["Flop/s"]
+      = benchmark::Counter(flops_per_itr, benchmark::Counter::kIsIterationInvariantRate);
+}
+BENCHMARK(BM_SM50_device_plus_multiplies_ssrgemm_nt_n)
+    ->RangeMultiplier(2)->Range(256, 4096);
+
+///////////////////////////////////////////////////////////////////////////////
+
+static void BM_SM50_device_plus_multiplies_ssrgemm_nt_t(benchmark::State &state) {
+  const auto N = static_cast<int>(state.range(0)); // state.range() returns int64_t
+  using precision = float;
+  using OpClass = cutlass::arch::OpClassSimt;
+  using SmArch = cutlass::arch::Sm50;
+
+  using AddOp = cuasr::plus<precision>;
+  using MultOp = cuasr::multiplies<precision>;
+
+  using Srgemm = cuasr::gemm::device::Srgemm< //
+      AddOp, MultOp, //
+      precision, cutlass::layout::ColumnMajor, //
+      precision, cutlass::layout::RowMajor, //
+      precision, cutlass::layout::RowMajor, //
+      precision, OpClass, SmArch>;
+
+  // setup bench harness
+  cuasr::bench::device::BenchHarness<Srgemm> bench({ N, N, N });
+
+  // benchmark loop
+  for (auto _ : state) {
+    benchmark::DoNotOptimize(bench.run());
+    cudaDeviceSynchronize();
+  }
+
+  double flops_per_itr = 2.0 * N * N * N;
+  state.counters["Flop/s"]
+      = benchmark::Counter(flops_per_itr, benchmark::Counter::kIsIterationInvariantRate);
+}
+BENCHMARK(BM_SM50_device_plus_multiplies_ssrgemm_nt_t)
+    ->RangeMultiplier(2)->Range(256, 4096);
+
+///////////////////////////////////////////////////////////////////////////////
+
+static void BM_SM50_device_plus_multiplies_ssrgemm_nn_n(benchmark::State &state) {
+  const auto N = static_cast<int>(state.range(0)); // state.range() returns int64_t
+  using precision = float;
+  using OpClass = cutlass::arch::OpClassSimt;
+  using SmArch = cutlass::arch::Sm50;
+
+  using AddOp = cuasr::plus<precision>;
+  using MultOp = cuasr::multiplies<precision>;
+
+  using Srgemm = cuasr::gemm::device::Srgemm< //
+      AddOp, MultOp, //
+      precision, cutlass::layout::ColumnMajor, //
+      precision, cutlass::layout::ColumnMajor, //
+      precision, cutlass::layout::ColumnMajor, //
+      precision, OpClass, SmArch>;
+
+  // setup bench harness
+  cuasr::bench::device::BenchHarness<Srgemm> bench({ N, N, N });
+
+  // benchmark loop
+  for (auto _ : state) {
+    benchmark::DoNotOptimize(bench.run());
+    cudaDeviceSynchronize();
+  }
+
+  double flops_per_itr = 2.0 * N * N * N;
+  state.counters["Flop/s"]
+      = benchmark::Counter(flops_per_itr, benchmark::Counter::kIsIterationInvariantRate);
+}
+BENCHMARK(BM_SM50_device_plus_multiplies_ssrgemm_nn_n)
+    ->RangeMultiplier(2)->Range(256, 4096);
+
+///////////////////////////////////////////////////////////////////////////////
+
+static void BM_SM50_device_plus_multiplies_ssrgemm_nn_t(benchmark::State &state) {
+  const auto N = static_cast<int>(state.range(0)); // state.range() returns int64_t
+  using precision = float;
+  using OpClass = cutlass::arch::OpClassSimt;
+  using SmArch = cutlass::arch::Sm50;
+
+  using AddOp = cuasr::plus<precision>;
+  using MultOp = cuasr::multiplies<precision>;
+
+  using Srgemm = cuasr::gemm::device::Srgemm< //
+      AddOp, MultOp, //
+      precision, cutlass::layout::ColumnMajor, //
+      precision, cutlass::layout::ColumnMajor, //
+      precision, cutlass::layout::RowMajor, //
+      precision, OpClass, SmArch>;
+
+  // setup bench harness
+  cuasr::bench::device::BenchHarness<Srgemm> bench({ N, N, N });
+
+  // benchmark loop
+  for (auto _ : state) {
+    benchmark::DoNotOptimize(bench.run());
+    cudaDeviceSynchronize();
+  }
+
+  double flops_per_itr = 2.0 * N * N * N;
+  state.counters["Flop/s"]
+      = benchmark::Counter(flops_per_itr, benchmark::Counter::kIsIterationInvariantRate);
+}
+BENCHMARK(BM_SM50_device_plus_multiplies_ssrgemm_nn_t)
+    ->RangeMultiplier(2)->Range(256, 4096);
+
+///////////////////////////////////////////////////////////////////////////////
+
+static void BM_SM50_device_minimum_plus_dsrgemm_tt_n(benchmark::State &state) {
+  const auto N = static_cast<int>(state.range(0)); // state.range() returns int64_t
+  using precision = double;
+  using OpClass = cutlass::arch::OpClassSimt;
+  using SmArch = cutlass::arch::Sm50;
+
+  using AddOp = cuasr::minimum<precision>;
+  using MultOp = cuasr::plus<precision>;
+
+  using Srgemm = cuasr::gemm::device::Srgemm< //
+      AddOp, MultOp, //
+      precision, cutlass::layout::RowMajor, //
+      precision, cutlass::layout::RowMajor, //
+      precision, cutlass::layout::ColumnMajor, //
+      precision, OpClass, SmArch>;
+
+  // setup bench harness
+  cuasr::bench::device::BenchHarness<Srgemm> bench({ N, N, N });
+
+  // benchmark loop
+  for (auto _ : state) {
+    benchmark::DoNotOptimize(bench.run());
+    cudaDeviceSynchronize();
+  }
+
+  double flops_per_itr = 2.0 * N * N * N;
+  state.counters["Flop/s"]
+      = benchmark::Counter(flops_per_itr, benchmark::Counter::kIsIterationInvariantRate);
+}
+BENCHMARK(BM_SM50_device_minimum_plus_dsrgemm_tt_n)
+    ->RangeMultiplier(2)->Range(256, 4096);
+
+///////////////////////////////////////////////////////////////////////////////
+
+static void BM_SM50_device_minimum_plus_dsrgemm_tt_t(benchmark::State &state) {
+  const auto N = static_cast<int>(state.range(0)); // state.range() returns int64_t
+  using precision = double;
+  using OpClass = cutlass::arch::OpClassSimt;
+  using SmArch = cutlass::arch::Sm50;
+
+  using AddOp = cuasr::minimum<precision>;
+  using MultOp = cuasr::plus<precision>;
+
+  using Srgemm = cuasr::gemm::device::Srgemm< //
+      AddOp, MultOp, //
+      precision, cutlass::layout::RowMajor, //
+      precision, cutlass::layout::RowMajor, //
+      precision, cutlass::layout::RowMajor, //
+      precision, OpClass, SmArch>;
+
+  // setup bench harness
+  cuasr::bench::device::BenchHarness<Srgemm> bench({ N, N, N });
+
+  // benchmark loop
+  for (auto _ : state) {
+    benchmark::DoNotOptimize(bench.run());
+    cudaDeviceSynchronize();
+  }
+
+  double flops_per_itr = 2.0 * N * N * N;
+  state.counters["Flop/s"]
+      = benchmark::Counter(flops_per_itr, benchmark::Counter::kIsIterationInvariantRate);
+}
+BENCHMARK(BM_SM50_device_minimum_plus_dsrgemm_tt_t)
+    ->RangeMultiplier(2)->Range(256, 4096);
+
+///////////////////////////////////////////////////////////////////////////////
+
+static void BM_SM50_device_minimum_plus_dsrgemm_tn_n(benchmark::State &state) {
+  const auto N = static_cast<int>(state.range(0)); // state.range() returns int64_t
+  using precision = double;
+  using OpClass = cutlass::arch::OpClassSimt;
+  using SmArch = cutlass::arch::Sm50;
+
+  using AddOp = cuasr::minimum<precision>;
+  using MultOp = cuasr::plus<precision>;
+
+  using Srgemm = cuasr::gemm::device::Srgemm< //
+      AddOp, MultOp, //
+      precision, cutlass::layout::RowMajor, //
+      precision, cutlass::layout::ColumnMajor, //
+      precision, cutlass::layout::ColumnMajor, //
+      precision, OpClass, SmArch>;
+
+  // setup bench harness
+  cuasr::bench::device::BenchHarness<Srgemm> bench({ N, N, N });
+
+  // benchmark loop
+  for (auto _ : state) {
+    benchmark::DoNotOptimize(bench.run());
+    cudaDeviceSynchronize();
+  }
+
+  double flops_per_itr = 2.0 * N * N * N;
+  state.counters["Flop/s"]
+      = benchmark::Counter(flops_per_itr, benchmark::Counter::kIsIterationInvariantRate);
+}
+BENCHMARK(BM_SM50_device_minimum_plus_dsrgemm_tn_n)
+    ->RangeMultiplier(2)->Range(256, 4096);
+
+///////////////////////////////////////////////////////////////////////////////
+
+static void BM_SM50_device_minimum_plus_dsrgemm_tn_t(benchmark::State &state) {
+  const auto N = static_cast<int>(state.range(0)); // state.range() returns int64_t
+  using precision = double;
+  using OpClass = cutlass::arch::OpClassSimt;
+  using SmArch = cutlass::arch::Sm50;
+
+  using AddOp = cuasr::minimum<precision>;
+  using MultOp = cuasr::plus<precision>;
+
+  using Srgemm = cuasr::gemm::device::Srgemm< //
+      AddOp, MultOp, //
+      precision, cutlass::layout::RowMajor, //
+      precision, cutlass::layout::ColumnMajor, //
+      precision, cutlass::layout::RowMajor, //
+      precision, OpClass, SmArch>;
+
+  // setup bench harness
+  cuasr::bench::device::BenchHarness<Srgemm> bench({ N, N, N });
+
+  // benchmark loop
+  for (auto _ : state) {
+    benchmark::DoNotOptimize(bench.run());
+    cudaDeviceSynchronize();
+  }
+
+  double flops_per_itr = 2.0 * N * N * N;
+  state.counters["Flop/s"]
+      = benchmark::Counter(flops_per_itr, benchmark::Counter::kIsIterationInvariantRate);
+}
+BENCHMARK(BM_SM50_device_minimum_plus_dsrgemm_tn_t)
+    ->RangeMultiplier(2)->Range(256, 4096);
+
+///////////////////////////////////////////////////////////////////////////////
+
+static void BM_SM50_device_minimum_plus_dsrgemm_nt_n(benchmark::State &state) {
+  const auto N = static_cast<int>(state.range(0)); // state.range() returns int64_t
+  using precision = double;
+  using OpClass = cutlass::arch::OpClassSimt;
+  using SmArch = cutlass::arch::Sm50;
+
+  using AddOp = cuasr::minimum<precision>;
+  using MultOp = cuasr::plus<precision>;
+
+  using Srgemm = cuasr::gemm::device::Srgemm< //
+      AddOp, MultOp, //
+      precision, cutlass::layout::ColumnMajor, //
+      precision, cutlass::layout::RowMajor, //
+      precision, cutlass::layout::ColumnMajor, //
+      precision, OpClass, SmArch>;
+
+  // setup bench harness
+  cuasr::bench::device::BenchHarness<Srgemm> bench({ N, N, N });
+
+  // benchmark loop
+  for (auto _ : state) {
+    benchmark::DoNotOptimize(bench.run());
+    cudaDeviceSynchronize();
+  }
+
+  double flops_per_itr = 2.0 * N * N * N;
+  state.counters["Flop/s"]
+      = benchmark::Counter(flops_per_itr, benchmark::Counter::kIsIterationInvariantRate);
+}
+BENCHMARK(BM_SM50_device_minimum_plus_dsrgemm_nt_n)
+    ->RangeMultiplier(2)->Range(256, 4096);
+
+///////////////////////////////////////////////////////////////////////////////
+
+static void BM_SM50_device_minimum_plus_dsrgemm_nt_t(benchmark::State &state) {
+  const auto N = static_cast<int>(state.range(0)); // state.range() returns int64_t
+  using precision = double;
+  using OpClass = cutlass::arch::OpClassSimt;
+  using SmArch = cutlass::arch::Sm50;
+
+  using AddOp = cuasr::minimum<precision>;
+  using MultOp = cuasr::plus<precision>;
+
+  using Srgemm = cuasr::gemm::device::Srgemm< //
+      AddOp, MultOp, //
+      precision, cutlass::layout::ColumnMajor, //
+      precision, cutlass::layout::RowMajor, //
+      precision, cutlass::layout::RowMajor, //
+      precision, OpClass, SmArch>;
+
+  // setup bench harness
+  cuasr::bench::device::BenchHarness<Srgemm> bench({ N, N, N });
+
+  // benchmark loop
+  for (auto _ : state) {
+    benchmark::DoNotOptimize(bench.run());
+    cudaDeviceSynchronize();
+  }
+
+  double flops_per_itr = 2.0 * N * N * N;
+  state.counters["Flop/s"]
+      = benchmark::Counter(flops_per_itr, benchmark::Counter::kIsIterationInvariantRate);
+}
+BENCHMARK(BM_SM50_device_minimum_plus_dsrgemm_nt_t)
+    ->RangeMultiplier(2)->Range(256, 4096);
+
+///////////////////////////////////////////////////////////////////////////////
+
+static void BM_SM50_device_minimum_plus_dsrgemm_nn_n(benchmark::State &state) {
+  const auto N = static_cast<int>(state.range(0)); // state.range() returns int64_t
+  using precision = double;
+  using OpClass = cutlass::arch::OpClassSimt;
+  using SmArch = cutlass::arch::Sm50;
+
+  using AddOp = cuasr::minimum<precision>;
+  using MultOp = cuasr::plus<precision>;
+
+  using Srgemm = cuasr::gemm::device::Srgemm< //
+      AddOp, MultOp, //
+      precision, cutlass::layout::ColumnMajor, //
+      precision, cutlass::layout::ColumnMajor, //
+      precision, cutlass::layout::ColumnMajor, //
+      precision, OpClass, SmArch>;
+
+  // setup bench harness
+  cuasr::bench::device::BenchHarness<Srgemm> bench({ N, N, N });
+
+  // benchmark loop
+  for (auto _ : state) {
+    benchmark::DoNotOptimize(bench.run());
+    cudaDeviceSynchronize();
+  }
+
+  double flops_per_itr = 2.0 * N * N * N;
+  state.counters["Flop/s"]
+      = benchmark::Counter(flops_per_itr, benchmark::Counter::kIsIterationInvariantRate);
+}
+BENCHMARK(BM_SM50_device_minimum_plus_dsrgemm_nn_n)
+    ->RangeMultiplier(2)->Range(256, 4096);
+
+///////////////////////////////////////////////////////////////////////////////
+
+static void BM_SM50_device_minimum_plus_dsrgemm_nn_t(benchmark::State &state) {
+  const auto N = static_cast<int>(state.range(0)); // state.range() returns int64_t
+  using precision = double;
+  using OpClass = cutlass::arch::OpClassSimt;
+  using SmArch = cutlass::arch::Sm50;
+
+  using AddOp = cuasr::minimum<precision>;
+  using MultOp = cuasr::plus<precision>;
+
+  using Srgemm = cuasr::gemm::device::Srgemm< //
+      AddOp, MultOp, //
+      precision, cutlass::layout::ColumnMajor, //
+      precision, cutlass::layout::ColumnMajor, //
+      precision, cutlass::layout::RowMajor, //
+      precision, OpClass, SmArch>;
+
+  // setup bench harness
+  cuasr::bench::device::BenchHarness<Srgemm> bench({ N, N, N });
+
+  // benchmark loop
+  for (auto _ : state) {
+    benchmark::DoNotOptimize(bench.run());
+    cudaDeviceSynchronize();
+  }
+
+  double flops_per_itr = 2.0 * N * N * N;
+  state.counters["Flop/s"]
+      = benchmark::Counter(flops_per_itr, benchmark::Counter::kIsIterationInvariantRate);
+}
+BENCHMARK(BM_SM50_device_minimum_plus_dsrgemm_nn_t)
+    ->RangeMultiplier(2)->Range(256, 4096);
+
+///////////////////////////////////////////////////////////////////////////////
+
+static void BM_SM50_device_minimum_plus_ssrgemm_tt_n(benchmark::State &state) {
+  const auto N = static_cast<int>(state.range(0)); // state.range() returns int64_t
+  using precision = float;
+  using OpClass = cutlass::arch::OpClassSimt;
+  using SmArch = cutlass::arch::Sm50;
+
+  using AddOp = cuasr::minimum<precision>;
+  using MultOp = cuasr::plus<precision>;
+
+  using Srgemm = cuasr::gemm::device::Srgemm< //
+      AddOp, MultOp, //
+      precision, cutlass::layout::RowMajor, //
+      precision, cutlass::layout::RowMajor, //
+      precision, cutlass::layout::ColumnMajor, //
+      precision, OpClass, SmArch>;
+
+  // setup bench harness
+  cuasr::bench::device::BenchHarness<Srgemm> bench({ N, N, N });
+
+  // benchmark loop
+  for (auto _ : state) {
+    benchmark::DoNotOptimize(bench.run());
+    cudaDeviceSynchronize();
+  }
+
+  double flops_per_itr = 2.0 * N * N * N;
+  state.counters["Flop/s"]
+      = benchmark::Counter(flops_per_itr, benchmark::Counter::kIsIterationInvariantRate);
+}
+BENCHMARK(BM_SM50_device_minimum_plus_ssrgemm_tt_n)
+    ->RangeMultiplier(2)->Range(256, 4096);
+
+///////////////////////////////////////////////////////////////////////////////
+
+static void BM_SM50_device_minimum_plus_ssrgemm_tt_t(benchmark::State &state) {
+  const auto N = static_cast<int>(state.range(0)); // state.range() returns int64_t
+  using precision = float;
+  using OpClass = cutlass::arch::OpClassSimt;
+  using SmArch = cutlass::arch::Sm50;
+
+  using AddOp = cuasr::minimum<precision>;
+  using MultOp = cuasr::plus<precision>;
+
+  using Srgemm = cuasr::gemm::device::Srgemm< //
+      AddOp, MultOp, //
+      precision, cutlass::layout::RowMajor, //
+      precision, cutlass::layout::RowMajor, //
+      precision, cutlass::layout::RowMajor, //
+      precision, OpClass, SmArch>;
+
+  // setup bench harness
+  cuasr::bench::device::BenchHarness<Srgemm> bench({ N, N, N });
+
+  // benchmark loop
+  for (auto _ : state) {
+    benchmark::DoNotOptimize(bench.run());
+    cudaDeviceSynchronize();
+  }
+
+  double flops_per_itr = 2.0 * N * N * N;
+  state.counters["Flop/s"]
+      = benchmark::Counter(flops_per_itr, benchmark::Counter::kIsIterationInvariantRate);
+}
+BENCHMARK(BM_SM50_device_minimum_plus_ssrgemm_tt_t)
+    ->RangeMultiplier(2)->Range(256, 4096);
+
+///////////////////////////////////////////////////////////////////////////////
+
+static void BM_SM50_device_minimum_plus_ssrgemm_tn_n(benchmark::State &state) {
+  const auto N = static_cast<int>(state.range(0)); // state.range() returns int64_t
+  using precision = float;
+  using OpClass = cutlass::arch::OpClassSimt;
+  using SmArch = cutlass::arch::Sm50;
+
+  using AddOp = cuasr::minimum<precision>;
+  using MultOp = cuasr::plus<precision>;
+
+  using Srgemm = cuasr::gemm::device::Srgemm< //
+      AddOp, MultOp, //
+      precision, cutlass::layout::RowMajor, //
+      precision, cutlass::layout::ColumnMajor, //
+      precision, cutlass::layout::ColumnMajor, //
+      precision, OpClass, SmArch>;
+
+  // setup bench harness
+  cuasr::bench::device::BenchHarness<Srgemm> bench({ N, N, N });
+
+  // benchmark loop
+  for (auto _ : state) {
+    benchmark::DoNotOptimize(bench.run());
+    cudaDeviceSynchronize();
+  }
+
+  double flops_per_itr = 2.0 * N * N * N;
+  state.counters["Flop/s"]
+      = benchmark::Counter(flops_per_itr, benchmark::Counter::kIsIterationInvariantRate);
+}
+BENCHMARK(BM_SM50_device_minimum_plus_ssrgemm_tn_n) + ->RangeMultiplier(2)->Range(256, 4096); + +/////////////////////////////////////////////////////////////////////////////// + +static void BM_SM50_device_minimum_plus_ssrgemm_tn_t(benchmark::State &state) { + const auto N = static_cast(state.range(0)); + using precision = float; + using OpClass = cutlass::arch::OpClassSimt; + using SmArch = cutlass::arch::Sm50; + + using AddOp = cuasr::minimum; + using MultOp = cuasr::plus; + + using Srgemm = cuasr::gemm::device::Srgemm< // + AddOp, MultOp, // + precision, cutlass::layout::RowMajor, // + precision, cutlass::layout::ColumnMajor, // + precision, cutlass::layout::RowMajor, // + precision, OpClass, SmArch>; + + // setup bench harness + cuasr::bench::device::BenchHarness bench({ N, N, N }); + + // benchmark loop + for (auto _ : state) { + benchmark::DoNotOptimize(bench.run()); + cudaDeviceSynchronize(); + } + + double flops_per_itr = 2.0 * N * N * N; + state.counters["Flop/s"] + = benchmark::Counter(flops_per_itr, benchmark::Counter::kIsIterationInvariantRate); +} +BENCHMARK(BM_SM50_device_minimum_plus_ssrgemm_tn_t) + ->RangeMultiplier(2)->Range(256, 4096); + +/////////////////////////////////////////////////////////////////////////////// + +static void BM_SM50_device_minimum_plus_ssrgemm_nt_n(benchmark::State &state) { + const auto N = static_cast(state.range(0)); + using precision = float; + using OpClass = cutlass::arch::OpClassSimt; + using SmArch = cutlass::arch::Sm50; + + using AddOp = cuasr::minimum; + using MultOp = cuasr::plus; + + using Srgemm = cuasr::gemm::device::Srgemm< // + AddOp, MultOp, // + precision, cutlass::layout::ColumnMajor, // + precision, cutlass::layout::RowMajor, // + precision, cutlass::layout::ColumnMajor, // + precision, OpClass, SmArch>; + + // setup bench harness + cuasr::bench::device::BenchHarness bench({ N, N, N }); + + // benchmark loop + for (auto _ : state) { + benchmark::DoNotOptimize(bench.run()); + cudaDeviceSynchronize(); + 
} + + double flops_per_itr = 2.0 * N * N * N; + state.counters["Flop/s"] + = benchmark::Counter(flops_per_itr, benchmark::Counter::kIsIterationInvariantRate); +} +BENCHMARK(BM_SM50_device_minimum_plus_ssrgemm_nt_n) + ->RangeMultiplier(2)->Range(256, 4096); + +/////////////////////////////////////////////////////////////////////////////// + +static void BM_SM50_device_minimum_plus_ssrgemm_nt_t(benchmark::State &state) { + const auto N = static_cast(state.range(0)); + using precision = float; + using OpClass = cutlass::arch::OpClassSimt; + using SmArch = cutlass::arch::Sm50; + + using AddOp = cuasr::minimum; + using MultOp = cuasr::plus; + + using Srgemm = cuasr::gemm::device::Srgemm< // + AddOp, MultOp, // + precision, cutlass::layout::ColumnMajor, // + precision, cutlass::layout::RowMajor, // + precision, cutlass::layout::RowMajor, // + precision, OpClass, SmArch>; + + // setup bench harness + cuasr::bench::device::BenchHarness bench({ N, N, N }); + + // benchmark loop + for (auto _ : state) { + benchmark::DoNotOptimize(bench.run()); + cudaDeviceSynchronize(); + } + + double flops_per_itr = 2.0 * N * N * N; + state.counters["Flop/s"] + = benchmark::Counter(flops_per_itr, benchmark::Counter::kIsIterationInvariantRate); +} +BENCHMARK(BM_SM50_device_minimum_plus_ssrgemm_nt_t) + ->RangeMultiplier(2)->Range(256, 4096); + +/////////////////////////////////////////////////////////////////////////////// + +static void BM_SM50_device_minimum_plus_ssrgemm_nn_n(benchmark::State &state) { + const auto N = static_cast(state.range(0)); + using precision = float; + using OpClass = cutlass::arch::OpClassSimt; + using SmArch = cutlass::arch::Sm50; + + using AddOp = cuasr::minimum; + using MultOp = cuasr::plus; + + using Srgemm = cuasr::gemm::device::Srgemm< // + AddOp, MultOp, // + precision, cutlass::layout::ColumnMajor, // + precision, cutlass::layout::ColumnMajor, // + precision, cutlass::layout::ColumnMajor, // + precision, OpClass, SmArch>; + + // setup bench harness + 
cuasr::bench::device::BenchHarness bench({ N, N, N }); + + // benchmark loop + for (auto _ : state) { + benchmark::DoNotOptimize(bench.run()); + cudaDeviceSynchronize(); + } + + double flops_per_itr = 2.0 * N * N * N; + state.counters["Flop/s"] + = benchmark::Counter(flops_per_itr, benchmark::Counter::kIsIterationInvariantRate); +} +BENCHMARK(BM_SM50_device_minimum_plus_ssrgemm_nn_n) + ->RangeMultiplier(2)->Range(256, 4096); + +/////////////////////////////////////////////////////////////////////////////// + +static void BM_SM50_device_minimum_plus_ssrgemm_nn_t(benchmark::State &state) { + const auto N = static_cast(state.range(0)); + using precision = float; + using OpClass = cutlass::arch::OpClassSimt; + using SmArch = cutlass::arch::Sm50; + + using AddOp = cuasr::minimum; + using MultOp = cuasr::plus; + + using Srgemm = cuasr::gemm::device::Srgemm< // + AddOp, MultOp, // + precision, cutlass::layout::ColumnMajor, // + precision, cutlass::layout::ColumnMajor, // + precision, cutlass::layout::RowMajor, // + precision, OpClass, SmArch>; + + // setup bench harness + cuasr::bench::device::BenchHarness bench({ N, N, N }); + + // benchmark loop + for (auto _ : state) { + benchmark::DoNotOptimize(bench.run()); + cudaDeviceSynchronize(); + } + + double flops_per_itr = 2.0 * N * N * N; + state.counters["Flop/s"] + = benchmark::Counter(flops_per_itr, benchmark::Counter::kIsIterationInvariantRate); +} +BENCHMARK(BM_SM50_device_minimum_plus_ssrgemm_nn_t) + ->RangeMultiplier(2)->Range(256, 4096); + +/////////////////////////////////////////////////////////////////////////////// + +static void BM_SM50_device_maximum_plus_dsrgemm_tt_n(benchmark::State &state) { + const auto N = static_cast(state.range(0)); + using precision = double; + using OpClass = cutlass::arch::OpClassSimt; + using SmArch = cutlass::arch::Sm50; + + using AddOp = cuasr::maximum; + using MultOp = cuasr::plus; + + using Srgemm = cuasr::gemm::device::Srgemm< // + AddOp, MultOp, // + precision, 
cutlass::layout::RowMajor, // + precision, cutlass::layout::RowMajor, // + precision, cutlass::layout::ColumnMajor, // + precision, OpClass, SmArch>; + + // setup bench harness + cuasr::bench::device::BenchHarness bench({ N, N, N }); + + // benchmark loop + for (auto _ : state) { + benchmark::DoNotOptimize(bench.run()); + cudaDeviceSynchronize(); + } + + double flops_per_itr = 2.0 * N * N * N; + state.counters["Flop/s"] + = benchmark::Counter(flops_per_itr, benchmark::Counter::kIsIterationInvariantRate); +} +BENCHMARK(BM_SM50_device_maximum_plus_dsrgemm_tt_n) + ->RangeMultiplier(2)->Range(256, 4096); + +/////////////////////////////////////////////////////////////////////////////// + +static void BM_SM50_device_maximum_plus_dsrgemm_tt_t(benchmark::State &state) { + const auto N = static_cast(state.range(0)); + using precision = double; + using OpClass = cutlass::arch::OpClassSimt; + using SmArch = cutlass::arch::Sm50; + + using AddOp = cuasr::maximum; + using MultOp = cuasr::plus; + + using Srgemm = cuasr::gemm::device::Srgemm< // + AddOp, MultOp, // + precision, cutlass::layout::RowMajor, // + precision, cutlass::layout::RowMajor, // + precision, cutlass::layout::RowMajor, // + precision, OpClass, SmArch>; + + // setup bench harness + cuasr::bench::device::BenchHarness bench({ N, N, N }); + + // benchmark loop + for (auto _ : state) { + benchmark::DoNotOptimize(bench.run()); + cudaDeviceSynchronize(); + } + + double flops_per_itr = 2.0 * N * N * N; + state.counters["Flop/s"] + = benchmark::Counter(flops_per_itr, benchmark::Counter::kIsIterationInvariantRate); +} +BENCHMARK(BM_SM50_device_maximum_plus_dsrgemm_tt_t) + ->RangeMultiplier(2)->Range(256, 4096); + +/////////////////////////////////////////////////////////////////////////////// + +static void BM_SM50_device_maximum_plus_dsrgemm_tn_n(benchmark::State &state) { + const auto N = static_cast(state.range(0)); + using precision = double; + using OpClass = cutlass::arch::OpClassSimt; + using SmArch = 
cutlass::arch::Sm50; + + using AddOp = cuasr::maximum; + using MultOp = cuasr::plus; + + using Srgemm = cuasr::gemm::device::Srgemm< // + AddOp, MultOp, // + precision, cutlass::layout::RowMajor, // + precision, cutlass::layout::ColumnMajor, // + precision, cutlass::layout::ColumnMajor, // + precision, OpClass, SmArch>; + + // setup bench harness + cuasr::bench::device::BenchHarness bench({ N, N, N }); + + // benchmark loop + for (auto _ : state) { + benchmark::DoNotOptimize(bench.run()); + cudaDeviceSynchronize(); + } + + double flops_per_itr = 2.0 * N * N * N; + state.counters["Flop/s"] + = benchmark::Counter(flops_per_itr, benchmark::Counter::kIsIterationInvariantRate); +} +BENCHMARK(BM_SM50_device_maximum_plus_dsrgemm_tn_n) + ->RangeMultiplier(2)->Range(256, 4096); + +/////////////////////////////////////////////////////////////////////////////// + +static void BM_SM50_device_maximum_plus_dsrgemm_tn_t(benchmark::State &state) { + const auto N = static_cast(state.range(0)); + using precision = double; + using OpClass = cutlass::arch::OpClassSimt; + using SmArch = cutlass::arch::Sm50; + + using AddOp = cuasr::maximum; + using MultOp = cuasr::plus; + + using Srgemm = cuasr::gemm::device::Srgemm< // + AddOp, MultOp, // + precision, cutlass::layout::RowMajor, // + precision, cutlass::layout::ColumnMajor, // + precision, cutlass::layout::RowMajor, // + precision, OpClass, SmArch>; + + // setup bench harness + cuasr::bench::device::BenchHarness bench({ N, N, N }); + + // benchmark loop + for (auto _ : state) { + benchmark::DoNotOptimize(bench.run()); + cudaDeviceSynchronize(); + } + + double flops_per_itr = 2.0 * N * N * N; + state.counters["Flop/s"] + = benchmark::Counter(flops_per_itr, benchmark::Counter::kIsIterationInvariantRate); +} +BENCHMARK(BM_SM50_device_maximum_plus_dsrgemm_tn_t) + ->RangeMultiplier(2)->Range(256, 4096); + +/////////////////////////////////////////////////////////////////////////////// + +static void 
BM_SM50_device_maximum_plus_dsrgemm_nt_n(benchmark::State &state) { + const auto N = static_cast(state.range(0)); + using precision = double; + using OpClass = cutlass::arch::OpClassSimt; + using SmArch = cutlass::arch::Sm50; + + using AddOp = cuasr::maximum; + using MultOp = cuasr::plus; + + using Srgemm = cuasr::gemm::device::Srgemm< // + AddOp, MultOp, // + precision, cutlass::layout::ColumnMajor, // + precision, cutlass::layout::RowMajor, // + precision, cutlass::layout::ColumnMajor, // + precision, OpClass, SmArch>; + + // setup bench harness + cuasr::bench::device::BenchHarness bench({ N, N, N }); + + // benchmark loop + for (auto _ : state) { + benchmark::DoNotOptimize(bench.run()); + cudaDeviceSynchronize(); + } + + double flops_per_itr = 2.0 * N * N * N; + state.counters["Flop/s"] + = benchmark::Counter(flops_per_itr, benchmark::Counter::kIsIterationInvariantRate); +} +BENCHMARK(BM_SM50_device_maximum_plus_dsrgemm_nt_n) + ->RangeMultiplier(2)->Range(256, 4096); + +/////////////////////////////////////////////////////////////////////////////// + +static void BM_SM50_device_maximum_plus_dsrgemm_nt_t(benchmark::State &state) { + const auto N = static_cast(state.range(0)); + using precision = double; + using OpClass = cutlass::arch::OpClassSimt; + using SmArch = cutlass::arch::Sm50; + + using AddOp = cuasr::maximum; + using MultOp = cuasr::plus; + + using Srgemm = cuasr::gemm::device::Srgemm< // + AddOp, MultOp, // + precision, cutlass::layout::ColumnMajor, // + precision, cutlass::layout::RowMajor, // + precision, cutlass::layout::RowMajor, // + precision, OpClass, SmArch>; + + // setup bench harness + cuasr::bench::device::BenchHarness bench({ N, N, N }); + + // benchmark loop + for (auto _ : state) { + benchmark::DoNotOptimize(bench.run()); + cudaDeviceSynchronize(); + } + + double flops_per_itr = 2.0 * N * N * N; + state.counters["Flop/s"] + = benchmark::Counter(flops_per_itr, benchmark::Counter::kIsIterationInvariantRate); +} 
+BENCHMARK(BM_SM50_device_maximum_plus_dsrgemm_nt_t) + ->RangeMultiplier(2)->Range(256, 4096); + +/////////////////////////////////////////////////////////////////////////////// + +static void BM_SM50_device_maximum_plus_dsrgemm_nn_n(benchmark::State &state) { + const auto N = static_cast(state.range(0)); + using precision = double; + using OpClass = cutlass::arch::OpClassSimt; + using SmArch = cutlass::arch::Sm50; + + using AddOp = cuasr::maximum; + using MultOp = cuasr::plus; + + using Srgemm = cuasr::gemm::device::Srgemm< // + AddOp, MultOp, // + precision, cutlass::layout::ColumnMajor, // + precision, cutlass::layout::ColumnMajor, // + precision, cutlass::layout::ColumnMajor, // + precision, OpClass, SmArch>; + + // setup bench harness + cuasr::bench::device::BenchHarness bench({ N, N, N }); + + // benchmark loop + for (auto _ : state) { + benchmark::DoNotOptimize(bench.run()); + cudaDeviceSynchronize(); + } + + double flops_per_itr = 2.0 * N * N * N; + state.counters["Flop/s"] + = benchmark::Counter(flops_per_itr, benchmark::Counter::kIsIterationInvariantRate); +} +BENCHMARK(BM_SM50_device_maximum_plus_dsrgemm_nn_n) + ->RangeMultiplier(2)->Range(256, 4096); + +/////////////////////////////////////////////////////////////////////////////// + +static void BM_SM50_device_maximum_plus_dsrgemm_nn_t(benchmark::State &state) { + const auto N = static_cast(state.range(0)); + using precision = double; + using OpClass = cutlass::arch::OpClassSimt; + using SmArch = cutlass::arch::Sm50; + + using AddOp = cuasr::maximum; + using MultOp = cuasr::plus; + + using Srgemm = cuasr::gemm::device::Srgemm< // + AddOp, MultOp, // + precision, cutlass::layout::ColumnMajor, // + precision, cutlass::layout::ColumnMajor, // + precision, cutlass::layout::RowMajor, // + precision, OpClass, SmArch>; + + // setup bench harness + cuasr::bench::device::BenchHarness bench({ N, N, N }); + + // benchmark loop + for (auto _ : state) { + benchmark::DoNotOptimize(bench.run()); + 
cudaDeviceSynchronize(); + } + + double flops_per_itr = 2.0 * N * N * N; + state.counters["Flop/s"] + = benchmark::Counter(flops_per_itr, benchmark::Counter::kIsIterationInvariantRate); +} +BENCHMARK(BM_SM50_device_maximum_plus_dsrgemm_nn_t) + ->RangeMultiplier(2)->Range(256, 4096); + +/////////////////////////////////////////////////////////////////////////////// + +static void BM_SM50_device_maximum_plus_ssrgemm_tt_n(benchmark::State &state) { + const auto N = static_cast(state.range(0)); + using precision = float; + using OpClass = cutlass::arch::OpClassSimt; + using SmArch = cutlass::arch::Sm50; + + using AddOp = cuasr::maximum; + using MultOp = cuasr::plus; + + using Srgemm = cuasr::gemm::device::Srgemm< // + AddOp, MultOp, // + precision, cutlass::layout::RowMajor, // + precision, cutlass::layout::RowMajor, // + precision, cutlass::layout::ColumnMajor, // + precision, OpClass, SmArch>; + + // setup bench harness + cuasr::bench::device::BenchHarness bench({ N, N, N }); + + // benchmark loop + for (auto _ : state) { + benchmark::DoNotOptimize(bench.run()); + cudaDeviceSynchronize(); + } + + double flops_per_itr = 2.0 * N * N * N; + state.counters["Flop/s"] + = benchmark::Counter(flops_per_itr, benchmark::Counter::kIsIterationInvariantRate); +} +BENCHMARK(BM_SM50_device_maximum_plus_ssrgemm_tt_n) + ->RangeMultiplier(2)->Range(256, 4096); + +/////////////////////////////////////////////////////////////////////////////// + +static void BM_SM50_device_maximum_plus_ssrgemm_tt_t(benchmark::State &state) { + const auto N = static_cast(state.range(0)); + using precision = float; + using OpClass = cutlass::arch::OpClassSimt; + using SmArch = cutlass::arch::Sm50; + + using AddOp = cuasr::maximum; + using MultOp = cuasr::plus; + + using Srgemm = cuasr::gemm::device::Srgemm< // + AddOp, MultOp, // + precision, cutlass::layout::RowMajor, // + precision, cutlass::layout::RowMajor, // + precision, cutlass::layout::RowMajor, // + precision, OpClass, SmArch>; + + // setup bench 
harness + cuasr::bench::device::BenchHarness bench({ N, N, N }); + + // benchmark loop + for (auto _ : state) { + benchmark::DoNotOptimize(bench.run()); + cudaDeviceSynchronize(); + } + + double flops_per_itr = 2.0 * N * N * N; + state.counters["Flop/s"] + = benchmark::Counter(flops_per_itr, benchmark::Counter::kIsIterationInvariantRate); +} +BENCHMARK(BM_SM50_device_maximum_plus_ssrgemm_tt_t) + ->RangeMultiplier(2)->Range(256, 4096); + +/////////////////////////////////////////////////////////////////////////////// + +static void BM_SM50_device_maximum_plus_ssrgemm_tn_n(benchmark::State &state) { + const auto N = static_cast(state.range(0)); + using precision = float; + using OpClass = cutlass::arch::OpClassSimt; + using SmArch = cutlass::arch::Sm50; + + using AddOp = cuasr::maximum; + using MultOp = cuasr::plus; + + using Srgemm = cuasr::gemm::device::Srgemm< // + AddOp, MultOp, // + precision, cutlass::layout::RowMajor, // + precision, cutlass::layout::ColumnMajor, // + precision, cutlass::layout::ColumnMajor, // + precision, OpClass, SmArch>; + + // setup bench harness + cuasr::bench::device::BenchHarness bench({ N, N, N }); + + // benchmark loop + for (auto _ : state) { + benchmark::DoNotOptimize(bench.run()); + cudaDeviceSynchronize(); + } + + double flops_per_itr = 2.0 * N * N * N; + state.counters["Flop/s"] + = benchmark::Counter(flops_per_itr, benchmark::Counter::kIsIterationInvariantRate); +} +BENCHMARK(BM_SM50_device_maximum_plus_ssrgemm_tn_n) + ->RangeMultiplier(2)->Range(256, 4096); + +/////////////////////////////////////////////////////////////////////////////// + +static void BM_SM50_device_maximum_plus_ssrgemm_tn_t(benchmark::State &state) { + const auto N = static_cast(state.range(0)); + using precision = float; + using OpClass = cutlass::arch::OpClassSimt; + using SmArch = cutlass::arch::Sm50; + + using AddOp = cuasr::maximum; + using MultOp = cuasr::plus; + + using Srgemm = cuasr::gemm::device::Srgemm< // + AddOp, MultOp, // + precision, 
cutlass::layout::RowMajor, // + precision, cutlass::layout::ColumnMajor, // + precision, cutlass::layout::RowMajor, // + precision, OpClass, SmArch>; + + // setup bench harness + cuasr::bench::device::BenchHarness bench({ N, N, N }); + + // benchmark loop + for (auto _ : state) { + benchmark::DoNotOptimize(bench.run()); + cudaDeviceSynchronize(); + } + + double flops_per_itr = 2.0 * N * N * N; + state.counters["Flop/s"] + = benchmark::Counter(flops_per_itr, benchmark::Counter::kIsIterationInvariantRate); +} +BENCHMARK(BM_SM50_device_maximum_plus_ssrgemm_tn_t) + ->RangeMultiplier(2)->Range(256, 4096); + +/////////////////////////////////////////////////////////////////////////////// + +static void BM_SM50_device_maximum_plus_ssrgemm_nt_n(benchmark::State &state) { + const auto N = static_cast(state.range(0)); + using precision = float; + using OpClass = cutlass::arch::OpClassSimt; + using SmArch = cutlass::arch::Sm50; + + using AddOp = cuasr::maximum; + using MultOp = cuasr::plus; + + using Srgemm = cuasr::gemm::device::Srgemm< // + AddOp, MultOp, // + precision, cutlass::layout::ColumnMajor, // + precision, cutlass::layout::RowMajor, // + precision, cutlass::layout::ColumnMajor, // + precision, OpClass, SmArch>; + + // setup bench harness + cuasr::bench::device::BenchHarness bench({ N, N, N }); + + // benchmark loop + for (auto _ : state) { + benchmark::DoNotOptimize(bench.run()); + cudaDeviceSynchronize(); + } + + double flops_per_itr = 2.0 * N * N * N; + state.counters["Flop/s"] + = benchmark::Counter(flops_per_itr, benchmark::Counter::kIsIterationInvariantRate); +} +BENCHMARK(BM_SM50_device_maximum_plus_ssrgemm_nt_n) + ->RangeMultiplier(2)->Range(256, 4096); + +/////////////////////////////////////////////////////////////////////////////// + +static void BM_SM50_device_maximum_plus_ssrgemm_nt_t(benchmark::State &state) { + const auto N = static_cast(state.range(0)); + using precision = float; + using OpClass = cutlass::arch::OpClassSimt; + using SmArch = 
cutlass::arch::Sm50; + + using AddOp = cuasr::maximum; + using MultOp = cuasr::plus; + + using Srgemm = cuasr::gemm::device::Srgemm< // + AddOp, MultOp, // + precision, cutlass::layout::ColumnMajor, // + precision, cutlass::layout::RowMajor, // + precision, cutlass::layout::RowMajor, // + precision, OpClass, SmArch>; + + // setup bench harness + cuasr::bench::device::BenchHarness bench({ N, N, N }); + + // benchmark loop + for (auto _ : state) { + benchmark::DoNotOptimize(bench.run()); + cudaDeviceSynchronize(); + } + + double flops_per_itr = 2.0 * N * N * N; + state.counters["Flop/s"] + = benchmark::Counter(flops_per_itr, benchmark::Counter::kIsIterationInvariantRate); +} +BENCHMARK(BM_SM50_device_maximum_plus_ssrgemm_nt_t) + ->RangeMultiplier(2)->Range(256, 4096); + +/////////////////////////////////////////////////////////////////////////////// + +static void BM_SM50_device_maximum_plus_ssrgemm_nn_n(benchmark::State &state) { + const auto N = static_cast(state.range(0)); + using precision = float; + using OpClass = cutlass::arch::OpClassSimt; + using SmArch = cutlass::arch::Sm50; + + using AddOp = cuasr::maximum; + using MultOp = cuasr::plus; + + using Srgemm = cuasr::gemm::device::Srgemm< // + AddOp, MultOp, // + precision, cutlass::layout::ColumnMajor, // + precision, cutlass::layout::ColumnMajor, // + precision, cutlass::layout::ColumnMajor, // + precision, OpClass, SmArch>; + + // setup bench harness + cuasr::bench::device::BenchHarness bench({ N, N, N }); + + // benchmark loop + for (auto _ : state) { + benchmark::DoNotOptimize(bench.run()); + cudaDeviceSynchronize(); + } + + double flops_per_itr = 2.0 * N * N * N; + state.counters["Flop/s"] + = benchmark::Counter(flops_per_itr, benchmark::Counter::kIsIterationInvariantRate); +} +BENCHMARK(BM_SM50_device_maximum_plus_ssrgemm_nn_n) + ->RangeMultiplier(2)->Range(256, 4096); + +/////////////////////////////////////////////////////////////////////////////// + +static void 
BM_SM50_device_maximum_plus_ssrgemm_nn_t(benchmark::State &state) { + const auto N = static_cast(state.range(0)); + using precision = float; + using OpClass = cutlass::arch::OpClassSimt; + using SmArch = cutlass::arch::Sm50; + + using AddOp = cuasr::maximum; + using MultOp = cuasr::plus; + + using Srgemm = cuasr::gemm::device::Srgemm< // + AddOp, MultOp, // + precision, cutlass::layout::ColumnMajor, // + precision, cutlass::layout::ColumnMajor, // + precision, cutlass::layout::RowMajor, // + precision, OpClass, SmArch>; + + // setup bench harness + cuasr::bench::device::BenchHarness bench({ N, N, N }); + + // benchmark loop + for (auto _ : state) { + benchmark::DoNotOptimize(bench.run()); + cudaDeviceSynchronize(); + } + + double flops_per_itr = 2.0 * N * N * N; + state.counters["Flop/s"] + = benchmark::Counter(flops_per_itr, benchmark::Counter::kIsIterationInvariantRate); +} +BENCHMARK(BM_SM50_device_maximum_plus_ssrgemm_nn_t) + ->RangeMultiplier(2)->Range(256, 4096); + +/////////////////////////////////////////////////////////////////////////////// + +static void BM_SM50_device_minimum_maximum_dsrgemm_tt_n(benchmark::State &state) { + const auto N = static_cast(state.range(0)); + using precision = double; + using OpClass = cutlass::arch::OpClassSimt; + using SmArch = cutlass::arch::Sm50; + + using AddOp = cuasr::minimum; + using MultOp = cuasr::maximum; + + using Srgemm = cuasr::gemm::device::Srgemm< // + AddOp, MultOp, // + precision, cutlass::layout::RowMajor, // + precision, cutlass::layout::RowMajor, // + precision, cutlass::layout::ColumnMajor, // + precision, OpClass, SmArch>; + + // setup bench harness + cuasr::bench::device::BenchHarness bench({ N, N, N }); + + // benchmark loop + for (auto _ : state) { + benchmark::DoNotOptimize(bench.run()); + cudaDeviceSynchronize(); + } + + double flops_per_itr = 2.0 * N * N * N; + state.counters["Flop/s"] + = benchmark::Counter(flops_per_itr, benchmark::Counter::kIsIterationInvariantRate); +} 
+BENCHMARK(BM_SM50_device_minimum_maximum_dsrgemm_tt_n) + ->RangeMultiplier(2)->Range(256, 4096); + +/////////////////////////////////////////////////////////////////////////////// + +static void BM_SM50_device_minimum_maximum_dsrgemm_tt_t(benchmark::State &state) { + const auto N = static_cast(state.range(0)); + using precision = double; + using OpClass = cutlass::arch::OpClassSimt; + using SmArch = cutlass::arch::Sm50; + + using AddOp = cuasr::minimum; + using MultOp = cuasr::maximum; + + using Srgemm = cuasr::gemm::device::Srgemm< // + AddOp, MultOp, // + precision, cutlass::layout::RowMajor, // + precision, cutlass::layout::RowMajor, // + precision, cutlass::layout::RowMajor, // + precision, OpClass, SmArch>; + + // setup bench harness + cuasr::bench::device::BenchHarness bench({ N, N, N }); + + // benchmark loop + for (auto _ : state) { + benchmark::DoNotOptimize(bench.run()); + cudaDeviceSynchronize(); + } + + double flops_per_itr = 2.0 * N * N * N; + state.counters["Flop/s"] + = benchmark::Counter(flops_per_itr, benchmark::Counter::kIsIterationInvariantRate); +} +BENCHMARK(BM_SM50_device_minimum_maximum_dsrgemm_tt_t) + ->RangeMultiplier(2)->Range(256, 4096); + +/////////////////////////////////////////////////////////////////////////////// + +static void BM_SM50_device_minimum_maximum_dsrgemm_tn_n(benchmark::State &state) { + const auto N = static_cast(state.range(0)); + using precision = double; + using OpClass = cutlass::arch::OpClassSimt; + using SmArch = cutlass::arch::Sm50; + + using AddOp = cuasr::minimum; + using MultOp = cuasr::maximum; + + using Srgemm = cuasr::gemm::device::Srgemm< // + AddOp, MultOp, // + precision, cutlass::layout::RowMajor, // + precision, cutlass::layout::ColumnMajor, // + precision, cutlass::layout::ColumnMajor, // + precision, OpClass, SmArch>; + + // setup bench harness + cuasr::bench::device::BenchHarness bench({ N, N, N }); + + // benchmark loop + for (auto _ : state) { + benchmark::DoNotOptimize(bench.run()); + 
cudaDeviceSynchronize(); + } + + double flops_per_itr = 2.0 * N * N * N; + state.counters["Flop/s"] + = benchmark::Counter(flops_per_itr, benchmark::Counter::kIsIterationInvariantRate); +} +BENCHMARK(BM_SM50_device_minimum_maximum_dsrgemm_tn_n) + ->RangeMultiplier(2)->Range(256, 4096); + +/////////////////////////////////////////////////////////////////////////////// + +static void BM_SM50_device_minimum_maximum_dsrgemm_tn_t(benchmark::State &state) { + const auto N = static_cast(state.range(0)); + using precision = double; + using OpClass = cutlass::arch::OpClassSimt; + using SmArch = cutlass::arch::Sm50; + + using AddOp = cuasr::minimum; + using MultOp = cuasr::maximum; + + using Srgemm = cuasr::gemm::device::Srgemm< // + AddOp, MultOp, // + precision, cutlass::layout::RowMajor, // + precision, cutlass::layout::ColumnMajor, // + precision, cutlass::layout::RowMajor, // + precision, OpClass, SmArch>; + + // setup bench harness + cuasr::bench::device::BenchHarness bench({ N, N, N }); + + // benchmark loop + for (auto _ : state) { + benchmark::DoNotOptimize(bench.run()); + cudaDeviceSynchronize(); + } + + double flops_per_itr = 2.0 * N * N * N; + state.counters["Flop/s"] + = benchmark::Counter(flops_per_itr, benchmark::Counter::kIsIterationInvariantRate); +} +BENCHMARK(BM_SM50_device_minimum_maximum_dsrgemm_tn_t) + ->RangeMultiplier(2)->Range(256, 4096); + +/////////////////////////////////////////////////////////////////////////////// + +static void BM_SM50_device_minimum_maximum_dsrgemm_nt_n(benchmark::State &state) { + const auto N = static_cast(state.range(0)); + using precision = double; + using OpClass = cutlass::arch::OpClassSimt; + using SmArch = cutlass::arch::Sm50; + + using AddOp = cuasr::minimum; + using MultOp = cuasr::maximum; + + using Srgemm = cuasr::gemm::device::Srgemm< // + AddOp, MultOp, // + precision, cutlass::layout::ColumnMajor, // + precision, cutlass::layout::RowMajor, // + precision, cutlass::layout::ColumnMajor, // + precision, OpClass, 
SmArch>; + + // setup bench harness + cuasr::bench::device::BenchHarness bench({ N, N, N }); + + // benchmark loop + for (auto _ : state) { + benchmark::DoNotOptimize(bench.run()); + cudaDeviceSynchronize(); + } + + double flops_per_itr = 2.0 * N * N * N; + state.counters["Flop/s"] + = benchmark::Counter(flops_per_itr, benchmark::Counter::kIsIterationInvariantRate); +} +BENCHMARK(BM_SM50_device_minimum_maximum_dsrgemm_nt_n) + ->RangeMultiplier(2)->Range(256, 4096); + +/////////////////////////////////////////////////////////////////////////////// + +static void BM_SM50_device_minimum_maximum_dsrgemm_nt_t(benchmark::State &state) { + const auto N = static_cast(state.range(0)); + using precision = double; + using OpClass = cutlass::arch::OpClassSimt; + using SmArch = cutlass::arch::Sm50; + + using AddOp = cuasr::minimum; + using MultOp = cuasr::maximum; + + using Srgemm = cuasr::gemm::device::Srgemm< // + AddOp, MultOp, // + precision, cutlass::layout::ColumnMajor, // + precision, cutlass::layout::RowMajor, // + precision, cutlass::layout::RowMajor, // + precision, OpClass, SmArch>; + + // setup bench harness + cuasr::bench::device::BenchHarness bench({ N, N, N }); + + // benchmark loop + for (auto _ : state) { + benchmark::DoNotOptimize(bench.run()); + cudaDeviceSynchronize(); + } + + double flops_per_itr = 2.0 * N * N * N; + state.counters["Flop/s"] + = benchmark::Counter(flops_per_itr, benchmark::Counter::kIsIterationInvariantRate); +} +BENCHMARK(BM_SM50_device_minimum_maximum_dsrgemm_nt_t) + ->RangeMultiplier(2)->Range(256, 4096); + +/////////////////////////////////////////////////////////////////////////////// + +static void BM_SM50_device_minimum_maximum_dsrgemm_nn_n(benchmark::State &state) { + const auto N = static_cast(state.range(0)); + using precision = double; + using OpClass = cutlass::arch::OpClassSimt; + using SmArch = cutlass::arch::Sm50; + + using AddOp = cuasr::minimum; + using MultOp = cuasr::maximum; + + using Srgemm = 
cuasr::gemm::device::Srgemm< // + AddOp, MultOp, // + precision, cutlass::layout::ColumnMajor, // + precision, cutlass::layout::ColumnMajor, // + precision, cutlass::layout::ColumnMajor, // + precision, OpClass, SmArch>; + + // setup bench harness + cuasr::bench::device::BenchHarness bench({ N, N, N }); + + // benchmark loop + for (auto _ : state) { + benchmark::DoNotOptimize(bench.run()); + cudaDeviceSynchronize(); + } + + double flops_per_itr = 2.0 * N * N * N; + state.counters["Flop/s"] + = benchmark::Counter(flops_per_itr, benchmark::Counter::kIsIterationInvariantRate); +} +BENCHMARK(BM_SM50_device_minimum_maximum_dsrgemm_nn_n) + ->RangeMultiplier(2)->Range(256, 4096); + +/////////////////////////////////////////////////////////////////////////////// + +static void BM_SM50_device_minimum_maximum_dsrgemm_nn_t(benchmark::State &state) { + const auto N = static_cast(state.range(0)); + using precision = double; + using OpClass = cutlass::arch::OpClassSimt; + using SmArch = cutlass::arch::Sm50; + + using AddOp = cuasr::minimum; + using MultOp = cuasr::maximum; + + using Srgemm = cuasr::gemm::device::Srgemm< // + AddOp, MultOp, // + precision, cutlass::layout::ColumnMajor, // + precision, cutlass::layout::ColumnMajor, // + precision, cutlass::layout::RowMajor, // + precision, OpClass, SmArch>; + + // setup bench harness + cuasr::bench::device::BenchHarness bench({ N, N, N }); + + // benchmark loop + for (auto _ : state) { + benchmark::DoNotOptimize(bench.run()); + cudaDeviceSynchronize(); + } + + double flops_per_itr = 2.0 * N * N * N; + state.counters["Flop/s"] + = benchmark::Counter(flops_per_itr, benchmark::Counter::kIsIterationInvariantRate); +} +BENCHMARK(BM_SM50_device_minimum_maximum_dsrgemm_nn_t) + ->RangeMultiplier(2)->Range(256, 4096); + +/////////////////////////////////////////////////////////////////////////////// + +static void BM_SM50_device_minimum_maximum_ssrgemm_tt_n(benchmark::State &state) { + const auto N = static_cast(state.range(0)); + using 
precision = float; + using OpClass = cutlass::arch::OpClassSimt; + using SmArch = cutlass::arch::Sm50; + + using AddOp = cuasr::minimum; + using MultOp = cuasr::maximum; + + using Srgemm = cuasr::gemm::device::Srgemm< // + AddOp, MultOp, // + precision, cutlass::layout::RowMajor, // + precision, cutlass::layout::RowMajor, // + precision, cutlass::layout::ColumnMajor, // + precision, OpClass, SmArch>; + + // setup bench harness + cuasr::bench::device::BenchHarness bench({ N, N, N }); + + // benchmark loop + for (auto _ : state) { + benchmark::DoNotOptimize(bench.run()); + cudaDeviceSynchronize(); + } + + double flops_per_itr = 2.0 * N * N * N; + state.counters["Flop/s"] + = benchmark::Counter(flops_per_itr, benchmark::Counter::kIsIterationInvariantRate); +} +BENCHMARK(BM_SM50_device_minimum_maximum_ssrgemm_tt_n) + ->RangeMultiplier(2)->Range(256, 4096); + +/////////////////////////////////////////////////////////////////////////////// + +static void BM_SM50_device_minimum_maximum_ssrgemm_tt_t(benchmark::State &state) { + const auto N = static_cast(state.range(0)); + using precision = float; + using OpClass = cutlass::arch::OpClassSimt; + using SmArch = cutlass::arch::Sm50; + + using AddOp = cuasr::minimum; + using MultOp = cuasr::maximum; + + using Srgemm = cuasr::gemm::device::Srgemm< // + AddOp, MultOp, // + precision, cutlass::layout::RowMajor, // + precision, cutlass::layout::RowMajor, // + precision, cutlass::layout::RowMajor, // + precision, OpClass, SmArch>; + + // setup bench harness + cuasr::bench::device::BenchHarness bench({ N, N, N }); + + // benchmark loop + for (auto _ : state) { + benchmark::DoNotOptimize(bench.run()); + cudaDeviceSynchronize(); + } + + double flops_per_itr = 2.0 * N * N * N; + state.counters["Flop/s"] + = benchmark::Counter(flops_per_itr, benchmark::Counter::kIsIterationInvariantRate); +} +BENCHMARK(BM_SM50_device_minimum_maximum_ssrgemm_tt_t) + ->RangeMultiplier(2)->Range(256, 4096); + 
+/////////////////////////////////////////////////////////////////////////////// + +static void BM_SM50_device_minimum_maximum_ssrgemm_tn_n(benchmark::State &state) { + const auto N = static_cast(state.range(0)); + using precision = float; + using OpClass = cutlass::arch::OpClassSimt; + using SmArch = cutlass::arch::Sm50; + + using AddOp = cuasr::minimum; + using MultOp = cuasr::maximum; + + using Srgemm = cuasr::gemm::device::Srgemm< // + AddOp, MultOp, // + precision, cutlass::layout::RowMajor, // + precision, cutlass::layout::ColumnMajor, // + precision, cutlass::layout::ColumnMajor, // + precision, OpClass, SmArch>; + + // setup bench harness + cuasr::bench::device::BenchHarness bench({ N, N, N }); + + // benchmark loop + for (auto _ : state) { + benchmark::DoNotOptimize(bench.run()); + cudaDeviceSynchronize(); + } + + double flops_per_itr = 2.0 * N * N * N; + state.counters["Flop/s"] + = benchmark::Counter(flops_per_itr, benchmark::Counter::kIsIterationInvariantRate); +} +BENCHMARK(BM_SM50_device_minimum_maximum_ssrgemm_tn_n) + ->RangeMultiplier(2)->Range(256, 4096); + +/////////////////////////////////////////////////////////////////////////////// + +static void BM_SM50_device_minimum_maximum_ssrgemm_tn_t(benchmark::State &state) { + const auto N = static_cast(state.range(0)); + using precision = float; + using OpClass = cutlass::arch::OpClassSimt; + using SmArch = cutlass::arch::Sm50; + + using AddOp = cuasr::minimum; + using MultOp = cuasr::maximum; + + using Srgemm = cuasr::gemm::device::Srgemm< // + AddOp, MultOp, // + precision, cutlass::layout::RowMajor, // + precision, cutlass::layout::ColumnMajor, // + precision, cutlass::layout::RowMajor, // + precision, OpClass, SmArch>; + + // setup bench harness + cuasr::bench::device::BenchHarness bench({ N, N, N }); + + // benchmark loop + for (auto _ : state) { + benchmark::DoNotOptimize(bench.run()); + cudaDeviceSynchronize(); + } + + double flops_per_itr = 2.0 * N * N * N; + state.counters["Flop/s"] + = 
benchmark::Counter(flops_per_itr, benchmark::Counter::kIsIterationInvariantRate); +} +BENCHMARK(BM_SM50_device_minimum_maximum_ssrgemm_tn_t) + ->RangeMultiplier(2)->Range(256, 4096); + +/////////////////////////////////////////////////////////////////////////////// + +static void BM_SM50_device_minimum_maximum_ssrgemm_nt_n(benchmark::State &state) { + const auto N = static_cast(state.range(0)); + using precision = float; + using OpClass = cutlass::arch::OpClassSimt; + using SmArch = cutlass::arch::Sm50; + + using AddOp = cuasr::minimum; + using MultOp = cuasr::maximum; + + using Srgemm = cuasr::gemm::device::Srgemm< // + AddOp, MultOp, // + precision, cutlass::layout::ColumnMajor, // + precision, cutlass::layout::RowMajor, // + precision, cutlass::layout::ColumnMajor, // + precision, OpClass, SmArch>; + + // setup bench harness + cuasr::bench::device::BenchHarness bench({ N, N, N }); + + // benchmark loop + for (auto _ : state) { + benchmark::DoNotOptimize(bench.run()); + cudaDeviceSynchronize(); + } + + double flops_per_itr = 2.0 * N * N * N; + state.counters["Flop/s"] + = benchmark::Counter(flops_per_itr, benchmark::Counter::kIsIterationInvariantRate); +} +BENCHMARK(BM_SM50_device_minimum_maximum_ssrgemm_nt_n) + ->RangeMultiplier(2)->Range(256, 4096); + +/////////////////////////////////////////////////////////////////////////////// + +static void BM_SM50_device_minimum_maximum_ssrgemm_nt_t(benchmark::State &state) { + const auto N = static_cast(state.range(0)); + using precision = float; + using OpClass = cutlass::arch::OpClassSimt; + using SmArch = cutlass::arch::Sm50; + + using AddOp = cuasr::minimum; + using MultOp = cuasr::maximum; + + using Srgemm = cuasr::gemm::device::Srgemm< // + AddOp, MultOp, // + precision, cutlass::layout::ColumnMajor, // + precision, cutlass::layout::RowMajor, // + precision, cutlass::layout::RowMajor, // + precision, OpClass, SmArch>; + + // setup bench harness + cuasr::bench::device::BenchHarness bench({ N, N, N }); + + // 
benchmark loop + for (auto _ : state) { + benchmark::DoNotOptimize(bench.run()); + cudaDeviceSynchronize(); + } + + double flops_per_itr = 2.0 * N * N * N; + state.counters["Flop/s"] + = benchmark::Counter(flops_per_itr, benchmark::Counter::kIsIterationInvariantRate); +} +BENCHMARK(BM_SM50_device_minimum_maximum_ssrgemm_nt_t) + ->RangeMultiplier(2)->Range(256, 4096); + +/////////////////////////////////////////////////////////////////////////////// + +static void BM_SM50_device_minimum_maximum_ssrgemm_nn_n(benchmark::State &state) { + const auto N = static_cast(state.range(0)); + using precision = float; + using OpClass = cutlass::arch::OpClassSimt; + using SmArch = cutlass::arch::Sm50; + + using AddOp = cuasr::minimum; + using MultOp = cuasr::maximum; + + using Srgemm = cuasr::gemm::device::Srgemm< // + AddOp, MultOp, // + precision, cutlass::layout::ColumnMajor, // + precision, cutlass::layout::ColumnMajor, // + precision, cutlass::layout::ColumnMajor, // + precision, OpClass, SmArch>; + + // setup bench harness + cuasr::bench::device::BenchHarness bench({ N, N, N }); + + // benchmark loop + for (auto _ : state) { + benchmark::DoNotOptimize(bench.run()); + cudaDeviceSynchronize(); + } + + double flops_per_itr = 2.0 * N * N * N; + state.counters["Flop/s"] + = benchmark::Counter(flops_per_itr, benchmark::Counter::kIsIterationInvariantRate); +} +BENCHMARK(BM_SM50_device_minimum_maximum_ssrgemm_nn_n) + ->RangeMultiplier(2)->Range(256, 4096); + +/////////////////////////////////////////////////////////////////////////////// + +static void BM_SM50_device_minimum_maximum_ssrgemm_nn_t(benchmark::State &state) { + const auto N = static_cast(state.range(0)); + using precision = float; + using OpClass = cutlass::arch::OpClassSimt; + using SmArch = cutlass::arch::Sm50; + + using AddOp = cuasr::minimum; + using MultOp = cuasr::maximum; + + using Srgemm = cuasr::gemm::device::Srgemm< // + AddOp, MultOp, // + precision, cutlass::layout::ColumnMajor, // + precision, 
cutlass::layout::ColumnMajor, // + precision, cutlass::layout::RowMajor, // + precision, OpClass, SmArch>; + + // setup bench harness + cuasr::bench::device::BenchHarness bench({ N, N, N }); + + // benchmark loop + for (auto _ : state) { + benchmark::DoNotOptimize(bench.run()); + cudaDeviceSynchronize(); + } + + double flops_per_itr = 2.0 * N * N * N; + state.counters["Flop/s"] + = benchmark::Counter(flops_per_itr, benchmark::Counter::kIsIterationInvariantRate); +} +BENCHMARK(BM_SM50_device_minimum_maximum_ssrgemm_nn_t) + ->RangeMultiplier(2)->Range(256, 4096); + +/////////////////////////////////////////////////////////////////////////////// + +static void BM_SM50_device_maximum_minimum_dsrgemm_tt_n(benchmark::State &state) { + const auto N = static_cast(state.range(0)); + using precision = double; + using OpClass = cutlass::arch::OpClassSimt; + using SmArch = cutlass::arch::Sm50; + + using AddOp = cuasr::maximum; + using MultOp = cuasr::minimum; + + using Srgemm = cuasr::gemm::device::Srgemm< // + AddOp, MultOp, // + precision, cutlass::layout::RowMajor, // + precision, cutlass::layout::RowMajor, // + precision, cutlass::layout::ColumnMajor, // + precision, OpClass, SmArch>; + + // setup bench harness + cuasr::bench::device::BenchHarness bench({ N, N, N }); + + // benchmark loop + for (auto _ : state) { + benchmark::DoNotOptimize(bench.run()); + cudaDeviceSynchronize(); + } + + double flops_per_itr = 2.0 * N * N * N; + state.counters["Flop/s"] + = benchmark::Counter(flops_per_itr, benchmark::Counter::kIsIterationInvariantRate); +} +BENCHMARK(BM_SM50_device_maximum_minimum_dsrgemm_tt_n) + ->RangeMultiplier(2)->Range(256, 4096); + +/////////////////////////////////////////////////////////////////////////////// + +static void BM_SM50_device_maximum_minimum_dsrgemm_tt_t(benchmark::State &state) { + const auto N = static_cast(state.range(0)); + using precision = double; + using OpClass = cutlass::arch::OpClassSimt; + using SmArch = cutlass::arch::Sm50; + + using AddOp 
= cuasr::maximum; + using MultOp = cuasr::minimum; + + using Srgemm = cuasr::gemm::device::Srgemm< // + AddOp, MultOp, // + precision, cutlass::layout::RowMajor, // + precision, cutlass::layout::RowMajor, // + precision, cutlass::layout::RowMajor, // + precision, OpClass, SmArch>; + + // setup bench harness + cuasr::bench::device::BenchHarness bench({ N, N, N }); + + // benchmark loop + for (auto _ : state) { + benchmark::DoNotOptimize(bench.run()); + cudaDeviceSynchronize(); + } + + double flops_per_itr = 2.0 * N * N * N; + state.counters["Flop/s"] + = benchmark::Counter(flops_per_itr, benchmark::Counter::kIsIterationInvariantRate); +} +BENCHMARK(BM_SM50_device_maximum_minimum_dsrgemm_tt_t) + ->RangeMultiplier(2)->Range(256, 4096); + +/////////////////////////////////////////////////////////////////////////////// + +static void BM_SM50_device_maximum_minimum_dsrgemm_tn_n(benchmark::State &state) { + const auto N = static_cast(state.range(0)); + using precision = double; + using OpClass = cutlass::arch::OpClassSimt; + using SmArch = cutlass::arch::Sm50; + + using AddOp = cuasr::maximum; + using MultOp = cuasr::minimum; + + using Srgemm = cuasr::gemm::device::Srgemm< // + AddOp, MultOp, // + precision, cutlass::layout::RowMajor, // + precision, cutlass::layout::ColumnMajor, // + precision, cutlass::layout::ColumnMajor, // + precision, OpClass, SmArch>; + + // setup bench harness + cuasr::bench::device::BenchHarness bench({ N, N, N }); + + // benchmark loop + for (auto _ : state) { + benchmark::DoNotOptimize(bench.run()); + cudaDeviceSynchronize(); + } + + double flops_per_itr = 2.0 * N * N * N; + state.counters["Flop/s"] + = benchmark::Counter(flops_per_itr, benchmark::Counter::kIsIterationInvariantRate); +} +BENCHMARK(BM_SM50_device_maximum_minimum_dsrgemm_tn_n) + ->RangeMultiplier(2)->Range(256, 4096); + +/////////////////////////////////////////////////////////////////////////////// + +static void BM_SM50_device_maximum_minimum_dsrgemm_tn_t(benchmark::State 
&state) { + const auto N = static_cast(state.range(0)); + using precision = double; + using OpClass = cutlass::arch::OpClassSimt; + using SmArch = cutlass::arch::Sm50; + + using AddOp = cuasr::maximum; + using MultOp = cuasr::minimum; + + using Srgemm = cuasr::gemm::device::Srgemm< // + AddOp, MultOp, // + precision, cutlass::layout::RowMajor, // + precision, cutlass::layout::ColumnMajor, // + precision, cutlass::layout::RowMajor, // + precision, OpClass, SmArch>; + + // setup bench harness + cuasr::bench::device::BenchHarness bench({ N, N, N }); + + // benchmark loop + for (auto _ : state) { + benchmark::DoNotOptimize(bench.run()); + cudaDeviceSynchronize(); + } + + double flops_per_itr = 2.0 * N * N * N; + state.counters["Flop/s"] + = benchmark::Counter(flops_per_itr, benchmark::Counter::kIsIterationInvariantRate); +} +BENCHMARK(BM_SM50_device_maximum_minimum_dsrgemm_tn_t) + ->RangeMultiplier(2)->Range(256, 4096); + +/////////////////////////////////////////////////////////////////////////////// + +static void BM_SM50_device_maximum_minimum_dsrgemm_nt_n(benchmark::State &state) { + const auto N = static_cast(state.range(0)); + using precision = double; + using OpClass = cutlass::arch::OpClassSimt; + using SmArch = cutlass::arch::Sm50; + + using AddOp = cuasr::maximum; + using MultOp = cuasr::minimum; + + using Srgemm = cuasr::gemm::device::Srgemm< // + AddOp, MultOp, // + precision, cutlass::layout::ColumnMajor, // + precision, cutlass::layout::RowMajor, // + precision, cutlass::layout::ColumnMajor, // + precision, OpClass, SmArch>; + + // setup bench harness + cuasr::bench::device::BenchHarness bench({ N, N, N }); + + // benchmark loop + for (auto _ : state) { + benchmark::DoNotOptimize(bench.run()); + cudaDeviceSynchronize(); + } + + double flops_per_itr = 2.0 * N * N * N; + state.counters["Flop/s"] + = benchmark::Counter(flops_per_itr, benchmark::Counter::kIsIterationInvariantRate); +} +BENCHMARK(BM_SM50_device_maximum_minimum_dsrgemm_nt_n) + 
->RangeMultiplier(2)->Range(256, 4096); + +/////////////////////////////////////////////////////////////////////////////// + +static void BM_SM50_device_maximum_minimum_dsrgemm_nt_t(benchmark::State &state) { + const auto N = static_cast(state.range(0)); + using precision = double; + using OpClass = cutlass::arch::OpClassSimt; + using SmArch = cutlass::arch::Sm50; + + using AddOp = cuasr::maximum; + using MultOp = cuasr::minimum; + + using Srgemm = cuasr::gemm::device::Srgemm< // + AddOp, MultOp, // + precision, cutlass::layout::ColumnMajor, // + precision, cutlass::layout::RowMajor, // + precision, cutlass::layout::RowMajor, // + precision, OpClass, SmArch>; + + // setup bench harness + cuasr::bench::device::BenchHarness bench({ N, N, N }); + + // benchmark loop + for (auto _ : state) { + benchmark::DoNotOptimize(bench.run()); + cudaDeviceSynchronize(); + } + + double flops_per_itr = 2.0 * N * N * N; + state.counters["Flop/s"] + = benchmark::Counter(flops_per_itr, benchmark::Counter::kIsIterationInvariantRate); +} +BENCHMARK(BM_SM50_device_maximum_minimum_dsrgemm_nt_t) + ->RangeMultiplier(2)->Range(256, 4096); + +/////////////////////////////////////////////////////////////////////////////// + +static void BM_SM50_device_maximum_minimum_dsrgemm_nn_n(benchmark::State &state) { + const auto N = static_cast(state.range(0)); + using precision = double; + using OpClass = cutlass::arch::OpClassSimt; + using SmArch = cutlass::arch::Sm50; + + using AddOp = cuasr::maximum; + using MultOp = cuasr::minimum; + + using Srgemm = cuasr::gemm::device::Srgemm< // + AddOp, MultOp, // + precision, cutlass::layout::ColumnMajor, // + precision, cutlass::layout::ColumnMajor, // + precision, cutlass::layout::ColumnMajor, // + precision, OpClass, SmArch>; + + // setup bench harness + cuasr::bench::device::BenchHarness bench({ N, N, N }); + + // benchmark loop + for (auto _ : state) { + benchmark::DoNotOptimize(bench.run()); + cudaDeviceSynchronize(); + } + + double flops_per_itr = 2.0 * 
N * N * N; + state.counters["Flop/s"] + = benchmark::Counter(flops_per_itr, benchmark::Counter::kIsIterationInvariantRate); +} +BENCHMARK(BM_SM50_device_maximum_minimum_dsrgemm_nn_n) + ->RangeMultiplier(2)->Range(256, 4096); + +/////////////////////////////////////////////////////////////////////////////// + +static void BM_SM50_device_maximum_minimum_dsrgemm_nn_t(benchmark::State &state) { + const auto N = static_cast(state.range(0)); + using precision = double; + using OpClass = cutlass::arch::OpClassSimt; + using SmArch = cutlass::arch::Sm50; + + using AddOp = cuasr::maximum; + using MultOp = cuasr::minimum; + + using Srgemm = cuasr::gemm::device::Srgemm< // + AddOp, MultOp, // + precision, cutlass::layout::ColumnMajor, // + precision, cutlass::layout::ColumnMajor, // + precision, cutlass::layout::RowMajor, // + precision, OpClass, SmArch>; + + // setup bench harness + cuasr::bench::device::BenchHarness bench({ N, N, N }); + + // benchmark loop + for (auto _ : state) { + benchmark::DoNotOptimize(bench.run()); + cudaDeviceSynchronize(); + } + + double flops_per_itr = 2.0 * N * N * N; + state.counters["Flop/s"] + = benchmark::Counter(flops_per_itr, benchmark::Counter::kIsIterationInvariantRate); +} +BENCHMARK(BM_SM50_device_maximum_minimum_dsrgemm_nn_t) + ->RangeMultiplier(2)->Range(256, 4096); + +/////////////////////////////////////////////////////////////////////////////// + +static void BM_SM50_device_maximum_minimum_ssrgemm_tt_n(benchmark::State &state) { + const auto N = static_cast(state.range(0)); + using precision = float; + using OpClass = cutlass::arch::OpClassSimt; + using SmArch = cutlass::arch::Sm50; + + using AddOp = cuasr::maximum; + using MultOp = cuasr::minimum; + + using Srgemm = cuasr::gemm::device::Srgemm< // + AddOp, MultOp, // + precision, cutlass::layout::RowMajor, // + precision, cutlass::layout::RowMajor, // + precision, cutlass::layout::ColumnMajor, // + precision, OpClass, SmArch>; + + // setup bench harness + 
cuasr::bench::device::BenchHarness bench({ N, N, N }); + + // benchmark loop + for (auto _ : state) { + benchmark::DoNotOptimize(bench.run()); + cudaDeviceSynchronize(); + } + + double flops_per_itr = 2.0 * N * N * N; + state.counters["Flop/s"] + = benchmark::Counter(flops_per_itr, benchmark::Counter::kIsIterationInvariantRate); +} +BENCHMARK(BM_SM50_device_maximum_minimum_ssrgemm_tt_n) + ->RangeMultiplier(2)->Range(256, 4096); + +/////////////////////////////////////////////////////////////////////////////// + +static void BM_SM50_device_maximum_minimum_ssrgemm_tt_t(benchmark::State &state) { + const auto N = static_cast(state.range(0)); + using precision = float; + using OpClass = cutlass::arch::OpClassSimt; + using SmArch = cutlass::arch::Sm50; + + using AddOp = cuasr::maximum; + using MultOp = cuasr::minimum; + + using Srgemm = cuasr::gemm::device::Srgemm< // + AddOp, MultOp, // + precision, cutlass::layout::RowMajor, // + precision, cutlass::layout::RowMajor, // + precision, cutlass::layout::RowMajor, // + precision, OpClass, SmArch>; + + // setup bench harness + cuasr::bench::device::BenchHarness bench({ N, N, N }); + + // benchmark loop + for (auto _ : state) { + benchmark::DoNotOptimize(bench.run()); + cudaDeviceSynchronize(); + } + + double flops_per_itr = 2.0 * N * N * N; + state.counters["Flop/s"] + = benchmark::Counter(flops_per_itr, benchmark::Counter::kIsIterationInvariantRate); +} +BENCHMARK(BM_SM50_device_maximum_minimum_ssrgemm_tt_t) + ->RangeMultiplier(2)->Range(256, 4096); + +/////////////////////////////////////////////////////////////////////////////// + +static void BM_SM50_device_maximum_minimum_ssrgemm_tn_n(benchmark::State &state) { + const auto N = static_cast(state.range(0)); + using precision = float; + using OpClass = cutlass::arch::OpClassSimt; + using SmArch = cutlass::arch::Sm50; + + using AddOp = cuasr::maximum; + using MultOp = cuasr::minimum; + + using Srgemm = cuasr::gemm::device::Srgemm< // + AddOp, MultOp, // + precision, 
cutlass::layout::RowMajor, // + precision, cutlass::layout::ColumnMajor, // + precision, cutlass::layout::ColumnMajor, // + precision, OpClass, SmArch>; + + // setup bench harness + cuasr::bench::device::BenchHarness bench({ N, N, N }); + + // benchmark loop + for (auto _ : state) { + benchmark::DoNotOptimize(bench.run()); + cudaDeviceSynchronize(); + } + + double flops_per_itr = 2.0 * N * N * N; + state.counters["Flop/s"] + = benchmark::Counter(flops_per_itr, benchmark::Counter::kIsIterationInvariantRate); +} +BENCHMARK(BM_SM50_device_maximum_minimum_ssrgemm_tn_n) + ->RangeMultiplier(2)->Range(256, 4096); + +/////////////////////////////////////////////////////////////////////////////// + +static void BM_SM50_device_maximum_minimum_ssrgemm_tn_t(benchmark::State &state) { + const auto N = static_cast(state.range(0)); + using precision = float; + using OpClass = cutlass::arch::OpClassSimt; + using SmArch = cutlass::arch::Sm50; + + using AddOp = cuasr::maximum; + using MultOp = cuasr::minimum; + + using Srgemm = cuasr::gemm::device::Srgemm< // + AddOp, MultOp, // + precision, cutlass::layout::RowMajor, // + precision, cutlass::layout::ColumnMajor, // + precision, cutlass::layout::RowMajor, // + precision, OpClass, SmArch>; + + // setup bench harness + cuasr::bench::device::BenchHarness bench({ N, N, N }); + + // benchmark loop + for (auto _ : state) { + benchmark::DoNotOptimize(bench.run()); + cudaDeviceSynchronize(); + } + + double flops_per_itr = 2.0 * N * N * N; + state.counters["Flop/s"] + = benchmark::Counter(flops_per_itr, benchmark::Counter::kIsIterationInvariantRate); +} +BENCHMARK(BM_SM50_device_maximum_minimum_ssrgemm_tn_t) + ->RangeMultiplier(2)->Range(256, 4096); + +/////////////////////////////////////////////////////////////////////////////// + +static void BM_SM50_device_maximum_minimum_ssrgemm_nt_n(benchmark::State &state) { + const auto N = static_cast(state.range(0)); + using precision = float; + using OpClass = cutlass::arch::OpClassSimt; + using 
SmArch = cutlass::arch::Sm50; + + using AddOp = cuasr::maximum; + using MultOp = cuasr::minimum; + + using Srgemm = cuasr::gemm::device::Srgemm< // + AddOp, MultOp, // + precision, cutlass::layout::ColumnMajor, // + precision, cutlass::layout::RowMajor, // + precision, cutlass::layout::ColumnMajor, // + precision, OpClass, SmArch>; + + // setup bench harness + cuasr::bench::device::BenchHarness bench({ N, N, N }); + + // benchmark loop + for (auto _ : state) { + benchmark::DoNotOptimize(bench.run()); + cudaDeviceSynchronize(); + } + + double flops_per_itr = 2.0 * N * N * N; + state.counters["Flop/s"] + = benchmark::Counter(flops_per_itr, benchmark::Counter::kIsIterationInvariantRate); +} +BENCHMARK(BM_SM50_device_maximum_minimum_ssrgemm_nt_n) + ->RangeMultiplier(2)->Range(256, 4096); + +/////////////////////////////////////////////////////////////////////////////// + +static void BM_SM50_device_maximum_minimum_ssrgemm_nt_t(benchmark::State &state) { + const auto N = static_cast(state.range(0)); + using precision = float; + using OpClass = cutlass::arch::OpClassSimt; + using SmArch = cutlass::arch::Sm50; + + using AddOp = cuasr::maximum; + using MultOp = cuasr::minimum; + + using Srgemm = cuasr::gemm::device::Srgemm< // + AddOp, MultOp, // + precision, cutlass::layout::ColumnMajor, // + precision, cutlass::layout::RowMajor, // + precision, cutlass::layout::RowMajor, // + precision, OpClass, SmArch>; + + // setup bench harness + cuasr::bench::device::BenchHarness bench({ N, N, N }); + + // benchmark loop + for (auto _ : state) { + benchmark::DoNotOptimize(bench.run()); + cudaDeviceSynchronize(); + } + + double flops_per_itr = 2.0 * N * N * N; + state.counters["Flop/s"] + = benchmark::Counter(flops_per_itr, benchmark::Counter::kIsIterationInvariantRate); +} +BENCHMARK(BM_SM50_device_maximum_minimum_ssrgemm_nt_t) + ->RangeMultiplier(2)->Range(256, 4096); + +/////////////////////////////////////////////////////////////////////////////// + +static void 
BM_SM50_device_maximum_minimum_ssrgemm_nn_n(benchmark::State &state) { + const auto N = static_cast(state.range(0)); + using precision = float; + using OpClass = cutlass::arch::OpClassSimt; + using SmArch = cutlass::arch::Sm50; + + using AddOp = cuasr::maximum; + using MultOp = cuasr::minimum; + + using Srgemm = cuasr::gemm::device::Srgemm< // + AddOp, MultOp, // + precision, cutlass::layout::ColumnMajor, // + precision, cutlass::layout::ColumnMajor, // + precision, cutlass::layout::ColumnMajor, // + precision, OpClass, SmArch>; + + // setup bench harness + cuasr::bench::device::BenchHarness bench({ N, N, N }); + + // benchmark loop + for (auto _ : state) { + benchmark::DoNotOptimize(bench.run()); + cudaDeviceSynchronize(); + } + + double flops_per_itr = 2.0 * N * N * N; + state.counters["Flop/s"] + = benchmark::Counter(flops_per_itr, benchmark::Counter::kIsIterationInvariantRate); +} +BENCHMARK(BM_SM50_device_maximum_minimum_ssrgemm_nn_n) + ->RangeMultiplier(2)->Range(256, 4096); + +/////////////////////////////////////////////////////////////////////////////// + +static void BM_SM50_device_maximum_minimum_ssrgemm_nn_t(benchmark::State &state) { + const auto N = static_cast(state.range(0)); + using precision = float; + using OpClass = cutlass::arch::OpClassSimt; + using SmArch = cutlass::arch::Sm50; + + using AddOp = cuasr::maximum; + using MultOp = cuasr::minimum; + + using Srgemm = cuasr::gemm::device::Srgemm< // + AddOp, MultOp, // + precision, cutlass::layout::ColumnMajor, // + precision, cutlass::layout::ColumnMajor, // + precision, cutlass::layout::RowMajor, // + precision, OpClass, SmArch>; + + // setup bench harness + cuasr::bench::device::BenchHarness bench({ N, N, N }); + + // benchmark loop + for (auto _ : state) { + benchmark::DoNotOptimize(bench.run()); + cudaDeviceSynchronize(); + } + + double flops_per_itr = 2.0 * N * N * N; + state.counters["Flop/s"] + = benchmark::Counter(flops_per_itr, benchmark::Counter::kIsIterationInvariantRate); +} 
+BENCHMARK(BM_SM50_device_maximum_minimum_ssrgemm_nn_t) + ->RangeMultiplier(2)->Range(256, 4096); + +/////////////////////////////////////////////////////////////////////////////// + +static void BM_SM50_device_minimum_multiplies_dsrgemm_tt_n(benchmark::State &state) { + const auto N = static_cast(state.range(0)); + using precision = double; + using OpClass = cutlass::arch::OpClassSimt; + using SmArch = cutlass::arch::Sm50; + + using AddOp = cuasr::minimum; + using MultOp = cuasr::multiplies; + + using Srgemm = cuasr::gemm::device::Srgemm< // + AddOp, MultOp, // + precision, cutlass::layout::RowMajor, // + precision, cutlass::layout::RowMajor, // + precision, cutlass::layout::ColumnMajor, // + precision, OpClass, SmArch>; + + // setup bench harness + cuasr::bench::device::BenchHarness bench({ N, N, N }); + + // benchmark loop + for (auto _ : state) { + benchmark::DoNotOptimize(bench.run()); + cudaDeviceSynchronize(); + } + + double flops_per_itr = 2.0 * N * N * N; + state.counters["Flop/s"] + = benchmark::Counter(flops_per_itr, benchmark::Counter::kIsIterationInvariantRate); +} +BENCHMARK(BM_SM50_device_minimum_multiplies_dsrgemm_tt_n) + ->RangeMultiplier(2)->Range(256, 4096); + +/////////////////////////////////////////////////////////////////////////////// + +static void BM_SM50_device_minimum_multiplies_dsrgemm_tt_t(benchmark::State &state) { + const auto N = static_cast(state.range(0)); + using precision = double; + using OpClass = cutlass::arch::OpClassSimt; + using SmArch = cutlass::arch::Sm50; + + using AddOp = cuasr::minimum; + using MultOp = cuasr::multiplies; + + using Srgemm = cuasr::gemm::device::Srgemm< // + AddOp, MultOp, // + precision, cutlass::layout::RowMajor, // + precision, cutlass::layout::RowMajor, // + precision, cutlass::layout::RowMajor, // + precision, OpClass, SmArch>; + + // setup bench harness + cuasr::bench::device::BenchHarness bench({ N, N, N }); + + // benchmark loop + for (auto _ : state) { + benchmark::DoNotOptimize(bench.run()); 
+ cudaDeviceSynchronize(); + } + + double flops_per_itr = 2.0 * N * N * N; + state.counters["Flop/s"] + = benchmark::Counter(flops_per_itr, benchmark::Counter::kIsIterationInvariantRate); +} +BENCHMARK(BM_SM50_device_minimum_multiplies_dsrgemm_tt_t) + ->RangeMultiplier(2)->Range(256, 4096); + +/////////////////////////////////////////////////////////////////////////////// + +static void BM_SM50_device_minimum_multiplies_dsrgemm_tn_n(benchmark::State &state) { + const auto N = static_cast(state.range(0)); + using precision = double; + using OpClass = cutlass::arch::OpClassSimt; + using SmArch = cutlass::arch::Sm50; + + using AddOp = cuasr::minimum; + using MultOp = cuasr::multiplies; + + using Srgemm = cuasr::gemm::device::Srgemm< // + AddOp, MultOp, // + precision, cutlass::layout::RowMajor, // + precision, cutlass::layout::ColumnMajor, // + precision, cutlass::layout::ColumnMajor, // + precision, OpClass, SmArch>; + + // setup bench harness + cuasr::bench::device::BenchHarness bench({ N, N, N }); + + // benchmark loop + for (auto _ : state) { + benchmark::DoNotOptimize(bench.run()); + cudaDeviceSynchronize(); + } + + double flops_per_itr = 2.0 * N * N * N; + state.counters["Flop/s"] + = benchmark::Counter(flops_per_itr, benchmark::Counter::kIsIterationInvariantRate); +} +BENCHMARK(BM_SM50_device_minimum_multiplies_dsrgemm_tn_n) + ->RangeMultiplier(2)->Range(256, 4096); + +/////////////////////////////////////////////////////////////////////////////// + +static void BM_SM50_device_minimum_multiplies_dsrgemm_tn_t(benchmark::State &state) { + const auto N = static_cast(state.range(0)); + using precision = double; + using OpClass = cutlass::arch::OpClassSimt; + using SmArch = cutlass::arch::Sm50; + + using AddOp = cuasr::minimum; + using MultOp = cuasr::multiplies; + + using Srgemm = cuasr::gemm::device::Srgemm< // + AddOp, MultOp, // + precision, cutlass::layout::RowMajor, // + precision, cutlass::layout::ColumnMajor, // + precision, cutlass::layout::RowMajor, // + 
precision, OpClass, SmArch>; + + // setup bench harness + cuasr::bench::device::BenchHarness bench({ N, N, N }); + + // benchmark loop + for (auto _ : state) { + benchmark::DoNotOptimize(bench.run()); + cudaDeviceSynchronize(); + } + + double flops_per_itr = 2.0 * N * N * N; + state.counters["Flop/s"] + = benchmark::Counter(flops_per_itr, benchmark::Counter::kIsIterationInvariantRate); +} +BENCHMARK(BM_SM50_device_minimum_multiplies_dsrgemm_tn_t) + ->RangeMultiplier(2)->Range(256, 4096); + +/////////////////////////////////////////////////////////////////////////////// + +static void BM_SM50_device_minimum_multiplies_dsrgemm_nt_n(benchmark::State &state) { + const auto N = static_cast(state.range(0)); + using precision = double; + using OpClass = cutlass::arch::OpClassSimt; + using SmArch = cutlass::arch::Sm50; + + using AddOp = cuasr::minimum; + using MultOp = cuasr::multiplies; + + using Srgemm = cuasr::gemm::device::Srgemm< // + AddOp, MultOp, // + precision, cutlass::layout::ColumnMajor, // + precision, cutlass::layout::RowMajor, // + precision, cutlass::layout::ColumnMajor, // + precision, OpClass, SmArch>; + + // setup bench harness + cuasr::bench::device::BenchHarness bench({ N, N, N }); + + // benchmark loop + for (auto _ : state) { + benchmark::DoNotOptimize(bench.run()); + cudaDeviceSynchronize(); + } + + double flops_per_itr = 2.0 * N * N * N; + state.counters["Flop/s"] + = benchmark::Counter(flops_per_itr, benchmark::Counter::kIsIterationInvariantRate); +} +BENCHMARK(BM_SM50_device_minimum_multiplies_dsrgemm_nt_n) + ->RangeMultiplier(2)->Range(256, 4096); + +/////////////////////////////////////////////////////////////////////////////// + +static void BM_SM50_device_minimum_multiplies_dsrgemm_nt_t(benchmark::State &state) { + const auto N = static_cast(state.range(0)); + using precision = double; + using OpClass = cutlass::arch::OpClassSimt; + using SmArch = cutlass::arch::Sm50; + + using AddOp = cuasr::minimum; + using MultOp = cuasr::multiplies; + + 
using Srgemm = cuasr::gemm::device::Srgemm< // + AddOp, MultOp, // + precision, cutlass::layout::ColumnMajor, // + precision, cutlass::layout::RowMajor, // + precision, cutlass::layout::RowMajor, // + precision, OpClass, SmArch>; + + // setup bench harness + cuasr::bench::device::BenchHarness bench({ N, N, N }); + + // benchmark loop + for (auto _ : state) { + benchmark::DoNotOptimize(bench.run()); + cudaDeviceSynchronize(); + } + + double flops_per_itr = 2.0 * N * N * N; + state.counters["Flop/s"] + = benchmark::Counter(flops_per_itr, benchmark::Counter::kIsIterationInvariantRate); +} +BENCHMARK(BM_SM50_device_minimum_multiplies_dsrgemm_nt_t) + ->RangeMultiplier(2)->Range(256, 4096); + +/////////////////////////////////////////////////////////////////////////////// + +static void BM_SM50_device_minimum_multiplies_dsrgemm_nn_n(benchmark::State &state) { + const auto N = static_cast(state.range(0)); + using precision = double; + using OpClass = cutlass::arch::OpClassSimt; + using SmArch = cutlass::arch::Sm50; + + using AddOp = cuasr::minimum; + using MultOp = cuasr::multiplies; + + using Srgemm = cuasr::gemm::device::Srgemm< // + AddOp, MultOp, // + precision, cutlass::layout::ColumnMajor, // + precision, cutlass::layout::ColumnMajor, // + precision, cutlass::layout::ColumnMajor, // + precision, OpClass, SmArch>; + + // setup bench harness + cuasr::bench::device::BenchHarness bench({ N, N, N }); + + // benchmark loop + for (auto _ : state) { + benchmark::DoNotOptimize(bench.run()); + cudaDeviceSynchronize(); + } + + double flops_per_itr = 2.0 * N * N * N; + state.counters["Flop/s"] + = benchmark::Counter(flops_per_itr, benchmark::Counter::kIsIterationInvariantRate); +} +BENCHMARK(BM_SM50_device_minimum_multiplies_dsrgemm_nn_n) + ->RangeMultiplier(2)->Range(256, 4096); + +/////////////////////////////////////////////////////////////////////////////// + +static void BM_SM50_device_minimum_multiplies_dsrgemm_nn_t(benchmark::State &state) { + const auto N = 
static_cast(state.range(0)); + using precision = double; + using OpClass = cutlass::arch::OpClassSimt; + using SmArch = cutlass::arch::Sm50; + + using AddOp = cuasr::minimum; + using MultOp = cuasr::multiplies; + + using Srgemm = cuasr::gemm::device::Srgemm< // + AddOp, MultOp, // + precision, cutlass::layout::ColumnMajor, // + precision, cutlass::layout::ColumnMajor, // + precision, cutlass::layout::RowMajor, // + precision, OpClass, SmArch>; + + // setup bench harness + cuasr::bench::device::BenchHarness bench({ N, N, N }); + + // benchmark loop + for (auto _ : state) { + benchmark::DoNotOptimize(bench.run()); + cudaDeviceSynchronize(); + } + + double flops_per_itr = 2.0 * N * N * N; + state.counters["Flop/s"] + = benchmark::Counter(flops_per_itr, benchmark::Counter::kIsIterationInvariantRate); +} +BENCHMARK(BM_SM50_device_minimum_multiplies_dsrgemm_nn_t) + ->RangeMultiplier(2)->Range(256, 4096); + +/////////////////////////////////////////////////////////////////////////////// + +static void BM_SM50_device_minimum_multiplies_ssrgemm_tt_n(benchmark::State &state) { + const auto N = static_cast(state.range(0)); + using precision = float; + using OpClass = cutlass::arch::OpClassSimt; + using SmArch = cutlass::arch::Sm50; + + using AddOp = cuasr::minimum; + using MultOp = cuasr::multiplies; + + using Srgemm = cuasr::gemm::device::Srgemm< // + AddOp, MultOp, // + precision, cutlass::layout::RowMajor, // + precision, cutlass::layout::RowMajor, // + precision, cutlass::layout::ColumnMajor, // + precision, OpClass, SmArch>; + + // setup bench harness + cuasr::bench::device::BenchHarness bench({ N, N, N }); + + // benchmark loop + for (auto _ : state) { + benchmark::DoNotOptimize(bench.run()); + cudaDeviceSynchronize(); + } + + double flops_per_itr = 2.0 * N * N * N; + state.counters["Flop/s"] + = benchmark::Counter(flops_per_itr, benchmark::Counter::kIsIterationInvariantRate); +} +BENCHMARK(BM_SM50_device_minimum_multiplies_ssrgemm_tt_n) + 
->RangeMultiplier(2)->Range(256, 4096); + +/////////////////////////////////////////////////////////////////////////////// + +static void BM_SM50_device_minimum_multiplies_ssrgemm_tt_t(benchmark::State &state) { + const auto N = static_cast(state.range(0)); + using precision = float; + using OpClass = cutlass::arch::OpClassSimt; + using SmArch = cutlass::arch::Sm50; + + using AddOp = cuasr::minimum; + using MultOp = cuasr::multiplies; + + using Srgemm = cuasr::gemm::device::Srgemm< // + AddOp, MultOp, // + precision, cutlass::layout::RowMajor, // + precision, cutlass::layout::RowMajor, // + precision, cutlass::layout::RowMajor, // + precision, OpClass, SmArch>; + + // setup bench harness + cuasr::bench::device::BenchHarness bench({ N, N, N }); + + // benchmark loop + for (auto _ : state) { + benchmark::DoNotOptimize(bench.run()); + cudaDeviceSynchronize(); + } + + double flops_per_itr = 2.0 * N * N * N; + state.counters["Flop/s"] + = benchmark::Counter(flops_per_itr, benchmark::Counter::kIsIterationInvariantRate); +} +BENCHMARK(BM_SM50_device_minimum_multiplies_ssrgemm_tt_t) + ->RangeMultiplier(2)->Range(256, 4096); + +/////////////////////////////////////////////////////////////////////////////// + +static void BM_SM50_device_minimum_multiplies_ssrgemm_tn_n(benchmark::State &state) { + const auto N = static_cast(state.range(0)); + using precision = float; + using OpClass = cutlass::arch::OpClassSimt; + using SmArch = cutlass::arch::Sm50; + + using AddOp = cuasr::minimum; + using MultOp = cuasr::multiplies; + + using Srgemm = cuasr::gemm::device::Srgemm< // + AddOp, MultOp, // + precision, cutlass::layout::RowMajor, // + precision, cutlass::layout::ColumnMajor, // + precision, cutlass::layout::ColumnMajor, // + precision, OpClass, SmArch>; + + // setup bench harness + cuasr::bench::device::BenchHarness bench({ N, N, N }); + + // benchmark loop + for (auto _ : state) { + benchmark::DoNotOptimize(bench.run()); + cudaDeviceSynchronize(); + } + + double flops_per_itr = 
2.0 * N * N * N; + state.counters["Flop/s"] + = benchmark::Counter(flops_per_itr, benchmark::Counter::kIsIterationInvariantRate); +} +BENCHMARK(BM_SM50_device_minimum_multiplies_ssrgemm_tn_n) + ->RangeMultiplier(2)->Range(256, 4096); + +/////////////////////////////////////////////////////////////////////////////// + +static void BM_SM50_device_minimum_multiplies_ssrgemm_tn_t(benchmark::State &state) { + const auto N = static_cast(state.range(0)); + using precision = float; + using OpClass = cutlass::arch::OpClassSimt; + using SmArch = cutlass::arch::Sm50; + + using AddOp = cuasr::minimum; + using MultOp = cuasr::multiplies; + + using Srgemm = cuasr::gemm::device::Srgemm< // + AddOp, MultOp, // + precision, cutlass::layout::RowMajor, // + precision, cutlass::layout::ColumnMajor, // + precision, cutlass::layout::RowMajor, // + precision, OpClass, SmArch>; + + // setup bench harness + cuasr::bench::device::BenchHarness bench({ N, N, N }); + + // benchmark loop + for (auto _ : state) { + benchmark::DoNotOptimize(bench.run()); + cudaDeviceSynchronize(); + } + + double flops_per_itr = 2.0 * N * N * N; + state.counters["Flop/s"] + = benchmark::Counter(flops_per_itr, benchmark::Counter::kIsIterationInvariantRate); +} +BENCHMARK(BM_SM50_device_minimum_multiplies_ssrgemm_tn_t) + ->RangeMultiplier(2)->Range(256, 4096); + +/////////////////////////////////////////////////////////////////////////////// + +static void BM_SM50_device_minimum_multiplies_ssrgemm_nt_n(benchmark::State &state) { + const auto N = static_cast(state.range(0)); + using precision = float; + using OpClass = cutlass::arch::OpClassSimt; + using SmArch = cutlass::arch::Sm50; + + using AddOp = cuasr::minimum; + using MultOp = cuasr::multiplies; + + using Srgemm = cuasr::gemm::device::Srgemm< // + AddOp, MultOp, // + precision, cutlass::layout::ColumnMajor, // + precision, cutlass::layout::RowMajor, // + precision, cutlass::layout::ColumnMajor, // + precision, OpClass, SmArch>; + + // setup bench harness + 
cuasr::bench::device::BenchHarness bench({ N, N, N }); + + // benchmark loop + for (auto _ : state) { + benchmark::DoNotOptimize(bench.run()); + cudaDeviceSynchronize(); + } + + double flops_per_itr = 2.0 * N * N * N; + state.counters["Flop/s"] + = benchmark::Counter(flops_per_itr, benchmark::Counter::kIsIterationInvariantRate); +} +BENCHMARK(BM_SM50_device_minimum_multiplies_ssrgemm_nt_n) + ->RangeMultiplier(2)->Range(256, 4096); + +/////////////////////////////////////////////////////////////////////////////// + +static void BM_SM50_device_minimum_multiplies_ssrgemm_nt_t(benchmark::State &state) { + const auto N = static_cast(state.range(0)); + using precision = float; + using OpClass = cutlass::arch::OpClassSimt; + using SmArch = cutlass::arch::Sm50; + + using AddOp = cuasr::minimum; + using MultOp = cuasr::multiplies; + + using Srgemm = cuasr::gemm::device::Srgemm< // + AddOp, MultOp, // + precision, cutlass::layout::ColumnMajor, // + precision, cutlass::layout::RowMajor, // + precision, cutlass::layout::RowMajor, // + precision, OpClass, SmArch>; + + // setup bench harness + cuasr::bench::device::BenchHarness bench({ N, N, N }); + + // benchmark loop + for (auto _ : state) { + benchmark::DoNotOptimize(bench.run()); + cudaDeviceSynchronize(); + } + + double flops_per_itr = 2.0 * N * N * N; + state.counters["Flop/s"] + = benchmark::Counter(flops_per_itr, benchmark::Counter::kIsIterationInvariantRate); +} +BENCHMARK(BM_SM50_device_minimum_multiplies_ssrgemm_nt_t) + ->RangeMultiplier(2)->Range(256, 4096); + +/////////////////////////////////////////////////////////////////////////////// + +static void BM_SM50_device_minimum_multiplies_ssrgemm_nn_n(benchmark::State &state) { + const auto N = static_cast(state.range(0)); + using precision = float; + using OpClass = cutlass::arch::OpClassSimt; + using SmArch = cutlass::arch::Sm50; + + using AddOp = cuasr::minimum; + using MultOp = cuasr::multiplies; + + using Srgemm = cuasr::gemm::device::Srgemm< // + AddOp, MultOp, 
// + precision, cutlass::layout::ColumnMajor, // + precision, cutlass::layout::ColumnMajor, // + precision, cutlass::layout::ColumnMajor, // + precision, OpClass, SmArch>; + + // setup bench harness + cuasr::bench::device::BenchHarness bench({ N, N, N }); + + // benchmark loop + for (auto _ : state) { + benchmark::DoNotOptimize(bench.run()); + cudaDeviceSynchronize(); + } + + double flops_per_itr = 2.0 * N * N * N; + state.counters["Flop/s"] + = benchmark::Counter(flops_per_itr, benchmark::Counter::kIsIterationInvariantRate); +} +BENCHMARK(BM_SM50_device_minimum_multiplies_ssrgemm_nn_n) + ->RangeMultiplier(2)->Range(256, 4096); + +/////////////////////////////////////////////////////////////////////////////// + +static void BM_SM50_device_minimum_multiplies_ssrgemm_nn_t(benchmark::State &state) { + const auto N = static_cast(state.range(0)); + using precision = float; + using OpClass = cutlass::arch::OpClassSimt; + using SmArch = cutlass::arch::Sm50; + + using AddOp = cuasr::minimum; + using MultOp = cuasr::multiplies; + + using Srgemm = cuasr::gemm::device::Srgemm< // + AddOp, MultOp, // + precision, cutlass::layout::ColumnMajor, // + precision, cutlass::layout::ColumnMajor, // + precision, cutlass::layout::RowMajor, // + precision, OpClass, SmArch>; + + // setup bench harness + cuasr::bench::device::BenchHarness bench({ N, N, N }); + + // benchmark loop + for (auto _ : state) { + benchmark::DoNotOptimize(bench.run()); + cudaDeviceSynchronize(); + } + + double flops_per_itr = 2.0 * N * N * N; + state.counters["Flop/s"] + = benchmark::Counter(flops_per_itr, benchmark::Counter::kIsIterationInvariantRate); +} +BENCHMARK(BM_SM50_device_minimum_multiplies_ssrgemm_nn_t) + ->RangeMultiplier(2)->Range(256, 4096); + +/////////////////////////////////////////////////////////////////////////////// + +static void BM_SM50_device_maximum_multiplies_dsrgemm_tt_n(benchmark::State &state) { + const auto N = static_cast(state.range(0)); + using precision = double; + using OpClass = 
cutlass::arch::OpClassSimt; + using SmArch = cutlass::arch::Sm50; + + using AddOp = cuasr::maximum; + using MultOp = cuasr::multiplies; + + using Srgemm = cuasr::gemm::device::Srgemm< // + AddOp, MultOp, // + precision, cutlass::layout::RowMajor, // + precision, cutlass::layout::RowMajor, // + precision, cutlass::layout::ColumnMajor, // + precision, OpClass, SmArch>; + + // setup bench harness + cuasr::bench::device::BenchHarness bench({ N, N, N }); + + // benchmark loop + for (auto _ : state) { + benchmark::DoNotOptimize(bench.run()); + cudaDeviceSynchronize(); + } + + double flops_per_itr = 2.0 * N * N * N; + state.counters["Flop/s"] + = benchmark::Counter(flops_per_itr, benchmark::Counter::kIsIterationInvariantRate); +} +BENCHMARK(BM_SM50_device_maximum_multiplies_dsrgemm_tt_n) + ->RangeMultiplier(2)->Range(256, 4096); + +/////////////////////////////////////////////////////////////////////////////// + +static void BM_SM50_device_maximum_multiplies_dsrgemm_tt_t(benchmark::State &state) { + const auto N = static_cast(state.range(0)); + using precision = double; + using OpClass = cutlass::arch::OpClassSimt; + using SmArch = cutlass::arch::Sm50; + + using AddOp = cuasr::maximum; + using MultOp = cuasr::multiplies; + + using Srgemm = cuasr::gemm::device::Srgemm< // + AddOp, MultOp, // + precision, cutlass::layout::RowMajor, // + precision, cutlass::layout::RowMajor, // + precision, cutlass::layout::RowMajor, // + precision, OpClass, SmArch>; + + // setup bench harness + cuasr::bench::device::BenchHarness bench({ N, N, N }); + + // benchmark loop + for (auto _ : state) { + benchmark::DoNotOptimize(bench.run()); + cudaDeviceSynchronize(); + } + + double flops_per_itr = 2.0 * N * N * N; + state.counters["Flop/s"] + = benchmark::Counter(flops_per_itr, benchmark::Counter::kIsIterationInvariantRate); +} +BENCHMARK(BM_SM50_device_maximum_multiplies_dsrgemm_tt_t) + ->RangeMultiplier(2)->Range(256, 4096); + 
+/////////////////////////////////////////////////////////////////////////////// + +static void BM_SM50_device_maximum_multiplies_dsrgemm_tn_n(benchmark::State &state) { + const auto N = static_cast(state.range(0)); + using precision = double; + using OpClass = cutlass::arch::OpClassSimt; + using SmArch = cutlass::arch::Sm50; + + using AddOp = cuasr::maximum; + using MultOp = cuasr::multiplies; + + using Srgemm = cuasr::gemm::device::Srgemm< // + AddOp, MultOp, // + precision, cutlass::layout::RowMajor, // + precision, cutlass::layout::ColumnMajor, // + precision, cutlass::layout::ColumnMajor, // + precision, OpClass, SmArch>; + + // setup bench harness + cuasr::bench::device::BenchHarness bench({ N, N, N }); + + // benchmark loop + for (auto _ : state) { + benchmark::DoNotOptimize(bench.run()); + cudaDeviceSynchronize(); + } + + double flops_per_itr = 2.0 * N * N * N; + state.counters["Flop/s"] + = benchmark::Counter(flops_per_itr, benchmark::Counter::kIsIterationInvariantRate); +} +BENCHMARK(BM_SM50_device_maximum_multiplies_dsrgemm_tn_n) + ->RangeMultiplier(2)->Range(256, 4096); + +/////////////////////////////////////////////////////////////////////////////// + +static void BM_SM50_device_maximum_multiplies_dsrgemm_tn_t(benchmark::State &state) { + const auto N = static_cast(state.range(0)); + using precision = double; + using OpClass = cutlass::arch::OpClassSimt; + using SmArch = cutlass::arch::Sm50; + + using AddOp = cuasr::maximum; + using MultOp = cuasr::multiplies; + + using Srgemm = cuasr::gemm::device::Srgemm< // + AddOp, MultOp, // + precision, cutlass::layout::RowMajor, // + precision, cutlass::layout::ColumnMajor, // + precision, cutlass::layout::RowMajor, // + precision, OpClass, SmArch>; + + // setup bench harness + cuasr::bench::device::BenchHarness bench({ N, N, N }); + + // benchmark loop + for (auto _ : state) { + benchmark::DoNotOptimize(bench.run()); + cudaDeviceSynchronize(); + } + + double flops_per_itr = 2.0 * N * N * N; + 
state.counters["Flop/s"] + = benchmark::Counter(flops_per_itr, benchmark::Counter::kIsIterationInvariantRate); +} +BENCHMARK(BM_SM50_device_maximum_multiplies_dsrgemm_tn_t) + ->RangeMultiplier(2)->Range(256, 4096); + +/////////////////////////////////////////////////////////////////////////////// + +static void BM_SM50_device_maximum_multiplies_dsrgemm_nt_n(benchmark::State &state) { + const auto N = static_cast(state.range(0)); + using precision = double; + using OpClass = cutlass::arch::OpClassSimt; + using SmArch = cutlass::arch::Sm50; + + using AddOp = cuasr::maximum; + using MultOp = cuasr::multiplies; + + using Srgemm = cuasr::gemm::device::Srgemm< // + AddOp, MultOp, // + precision, cutlass::layout::ColumnMajor, // + precision, cutlass::layout::RowMajor, // + precision, cutlass::layout::ColumnMajor, // + precision, OpClass, SmArch>; + + // setup bench harness + cuasr::bench::device::BenchHarness bench({ N, N, N }); + + // benchmark loop + for (auto _ : state) { + benchmark::DoNotOptimize(bench.run()); + cudaDeviceSynchronize(); + } + + double flops_per_itr = 2.0 * N * N * N; + state.counters["Flop/s"] + = benchmark::Counter(flops_per_itr, benchmark::Counter::kIsIterationInvariantRate); +} +BENCHMARK(BM_SM50_device_maximum_multiplies_dsrgemm_nt_n) + ->RangeMultiplier(2)->Range(256, 4096); + +/////////////////////////////////////////////////////////////////////////////// + +static void BM_SM50_device_maximum_multiplies_dsrgemm_nt_t(benchmark::State &state) { + const auto N = static_cast(state.range(0)); + using precision = double; + using OpClass = cutlass::arch::OpClassSimt; + using SmArch = cutlass::arch::Sm50; + + using AddOp = cuasr::maximum; + using MultOp = cuasr::multiplies; + + using Srgemm = cuasr::gemm::device::Srgemm< // + AddOp, MultOp, // + precision, cutlass::layout::ColumnMajor, // + precision, cutlass::layout::RowMajor, // + precision, cutlass::layout::RowMajor, // + precision, OpClass, SmArch>; + + // setup bench harness + 
cuasr::bench::device::BenchHarness bench({ N, N, N }); + + // benchmark loop + for (auto _ : state) { + benchmark::DoNotOptimize(bench.run()); + cudaDeviceSynchronize(); + } + + double flops_per_itr = 2.0 * N * N * N; + state.counters["Flop/s"] + = benchmark::Counter(flops_per_itr, benchmark::Counter::kIsIterationInvariantRate); +} +BENCHMARK(BM_SM50_device_maximum_multiplies_dsrgemm_nt_t) + ->RangeMultiplier(2)->Range(256, 4096); + +/////////////////////////////////////////////////////////////////////////////// + +static void BM_SM50_device_maximum_multiplies_dsrgemm_nn_n(benchmark::State &state) { + const auto N = static_cast(state.range(0)); + using precision = double; + using OpClass = cutlass::arch::OpClassSimt; + using SmArch = cutlass::arch::Sm50; + + using AddOp = cuasr::maximum; + using MultOp = cuasr::multiplies; + + using Srgemm = cuasr::gemm::device::Srgemm< // + AddOp, MultOp, // + precision, cutlass::layout::ColumnMajor, // + precision, cutlass::layout::ColumnMajor, // + precision, cutlass::layout::ColumnMajor, // + precision, OpClass, SmArch>; + + // setup bench harness + cuasr::bench::device::BenchHarness bench({ N, N, N }); + + // benchmark loop + for (auto _ : state) { + benchmark::DoNotOptimize(bench.run()); + cudaDeviceSynchronize(); + } + + double flops_per_itr = 2.0 * N * N * N; + state.counters["Flop/s"] + = benchmark::Counter(flops_per_itr, benchmark::Counter::kIsIterationInvariantRate); +} +BENCHMARK(BM_SM50_device_maximum_multiplies_dsrgemm_nn_n) + ->RangeMultiplier(2)->Range(256, 4096); + +/////////////////////////////////////////////////////////////////////////////// + +static void BM_SM50_device_maximum_multiplies_dsrgemm_nn_t(benchmark::State &state) { + const auto N = static_cast(state.range(0)); + using precision = double; + using OpClass = cutlass::arch::OpClassSimt; + using SmArch = cutlass::arch::Sm50; + + using AddOp = cuasr::maximum; + using MultOp = cuasr::multiplies; + + using Srgemm = cuasr::gemm::device::Srgemm< // + AddOp, 
MultOp, // + precision, cutlass::layout::ColumnMajor, // + precision, cutlass::layout::ColumnMajor, // + precision, cutlass::layout::RowMajor, // + precision, OpClass, SmArch>; + + // setup bench harness + cuasr::bench::device::BenchHarness bench({ N, N, N }); + + // benchmark loop + for (auto _ : state) { + benchmark::DoNotOptimize(bench.run()); + cudaDeviceSynchronize(); + } + + double flops_per_itr = 2.0 * N * N * N; + state.counters["Flop/s"] + = benchmark::Counter(flops_per_itr, benchmark::Counter::kIsIterationInvariantRate); +} +BENCHMARK(BM_SM50_device_maximum_multiplies_dsrgemm_nn_t) + ->RangeMultiplier(2)->Range(256, 4096); + +/////////////////////////////////////////////////////////////////////////////// + +static void BM_SM50_device_maximum_multiplies_ssrgemm_tt_n(benchmark::State &state) { + const auto N = static_cast(state.range(0)); + using precision = float; + using OpClass = cutlass::arch::OpClassSimt; + using SmArch = cutlass::arch::Sm50; + + using AddOp = cuasr::maximum; + using MultOp = cuasr::multiplies; + + using Srgemm = cuasr::gemm::device::Srgemm< // + AddOp, MultOp, // + precision, cutlass::layout::RowMajor, // + precision, cutlass::layout::RowMajor, // + precision, cutlass::layout::ColumnMajor, // + precision, OpClass, SmArch>; + + // setup bench harness + cuasr::bench::device::BenchHarness bench({ N, N, N }); + + // benchmark loop + for (auto _ : state) { + benchmark::DoNotOptimize(bench.run()); + cudaDeviceSynchronize(); + } + + double flops_per_itr = 2.0 * N * N * N; + state.counters["Flop/s"] + = benchmark::Counter(flops_per_itr, benchmark::Counter::kIsIterationInvariantRate); +} +BENCHMARK(BM_SM50_device_maximum_multiplies_ssrgemm_tt_n) + ->RangeMultiplier(2)->Range(256, 4096); + +/////////////////////////////////////////////////////////////////////////////// + +static void BM_SM50_device_maximum_multiplies_ssrgemm_tt_t(benchmark::State &state) { + const auto N = static_cast(state.range(0)); + using precision = float; + using OpClass 
= cutlass::arch::OpClassSimt; + using SmArch = cutlass::arch::Sm50; + + using AddOp = cuasr::maximum; + using MultOp = cuasr::multiplies; + + using Srgemm = cuasr::gemm::device::Srgemm< // + AddOp, MultOp, // + precision, cutlass::layout::RowMajor, // + precision, cutlass::layout::RowMajor, // + precision, cutlass::layout::RowMajor, // + precision, OpClass, SmArch>; + + // setup bench harness + cuasr::bench::device::BenchHarness bench({ N, N, N }); + + // benchmark loop + for (auto _ : state) { + benchmark::DoNotOptimize(bench.run()); + cudaDeviceSynchronize(); + } + + double flops_per_itr = 2.0 * N * N * N; + state.counters["Flop/s"] + = benchmark::Counter(flops_per_itr, benchmark::Counter::kIsIterationInvariantRate); +} +BENCHMARK(BM_SM50_device_maximum_multiplies_ssrgemm_tt_t) + ->RangeMultiplier(2)->Range(256, 4096); + +/////////////////////////////////////////////////////////////////////////////// + +static void BM_SM50_device_maximum_multiplies_ssrgemm_tn_n(benchmark::State &state) { + const auto N = static_cast(state.range(0)); + using precision = float; + using OpClass = cutlass::arch::OpClassSimt; + using SmArch = cutlass::arch::Sm50; + + using AddOp = cuasr::maximum; + using MultOp = cuasr::multiplies; + + using Srgemm = cuasr::gemm::device::Srgemm< // + AddOp, MultOp, // + precision, cutlass::layout::RowMajor, // + precision, cutlass::layout::ColumnMajor, // + precision, cutlass::layout::ColumnMajor, // + precision, OpClass, SmArch>; + + // setup bench harness + cuasr::bench::device::BenchHarness bench({ N, N, N }); + + // benchmark loop + for (auto _ : state) { + benchmark::DoNotOptimize(bench.run()); + cudaDeviceSynchronize(); + } + + double flops_per_itr = 2.0 * N * N * N; + state.counters["Flop/s"] + = benchmark::Counter(flops_per_itr, benchmark::Counter::kIsIterationInvariantRate); +} +BENCHMARK(BM_SM50_device_maximum_multiplies_ssrgemm_tn_n) + ->RangeMultiplier(2)->Range(256, 4096); + 
+/////////////////////////////////////////////////////////////////////////////// + +static void BM_SM50_device_maximum_multiplies_ssrgemm_tn_t(benchmark::State &state) { + const auto N = static_cast(state.range(0)); + using precision = float; + using OpClass = cutlass::arch::OpClassSimt; + using SmArch = cutlass::arch::Sm50; + + using AddOp = cuasr::maximum; + using MultOp = cuasr::multiplies; + + using Srgemm = cuasr::gemm::device::Srgemm< // + AddOp, MultOp, // + precision, cutlass::layout::RowMajor, // + precision, cutlass::layout::ColumnMajor, // + precision, cutlass::layout::RowMajor, // + precision, OpClass, SmArch>; + + // setup bench harness + cuasr::bench::device::BenchHarness bench({ N, N, N }); + + // benchmark loop + for (auto _ : state) { + benchmark::DoNotOptimize(bench.run()); + cudaDeviceSynchronize(); + } + + double flops_per_itr = 2.0 * N * N * N; + state.counters["Flop/s"] + = benchmark::Counter(flops_per_itr, benchmark::Counter::kIsIterationInvariantRate); +} +BENCHMARK(BM_SM50_device_maximum_multiplies_ssrgemm_tn_t) + ->RangeMultiplier(2)->Range(256, 4096); + +/////////////////////////////////////////////////////////////////////////////// + +static void BM_SM50_device_maximum_multiplies_ssrgemm_nt_n(benchmark::State &state) { + const auto N = static_cast(state.range(0)); + using precision = float; + using OpClass = cutlass::arch::OpClassSimt; + using SmArch = cutlass::arch::Sm50; + + using AddOp = cuasr::maximum; + using MultOp = cuasr::multiplies; + + using Srgemm = cuasr::gemm::device::Srgemm< // + AddOp, MultOp, // + precision, cutlass::layout::ColumnMajor, // + precision, cutlass::layout::RowMajor, // + precision, cutlass::layout::ColumnMajor, // + precision, OpClass, SmArch>; + + // setup bench harness + cuasr::bench::device::BenchHarness bench({ N, N, N }); + + // benchmark loop + for (auto _ : state) { + benchmark::DoNotOptimize(bench.run()); + cudaDeviceSynchronize(); + } + + double flops_per_itr = 2.0 * N * N * N; + 
state.counters["Flop/s"] + = benchmark::Counter(flops_per_itr, benchmark::Counter::kIsIterationInvariantRate); +} +BENCHMARK(BM_SM50_device_maximum_multiplies_ssrgemm_nt_n) + ->RangeMultiplier(2)->Range(256, 4096); + +/////////////////////////////////////////////////////////////////////////////// + +static void BM_SM50_device_maximum_multiplies_ssrgemm_nt_t(benchmark::State &state) { + const auto N = static_cast(state.range(0)); + using precision = float; + using OpClass = cutlass::arch::OpClassSimt; + using SmArch = cutlass::arch::Sm50; + + using AddOp = cuasr::maximum; + using MultOp = cuasr::multiplies; + + using Srgemm = cuasr::gemm::device::Srgemm< // + AddOp, MultOp, // + precision, cutlass::layout::ColumnMajor, // + precision, cutlass::layout::RowMajor, // + precision, cutlass::layout::RowMajor, // + precision, OpClass, SmArch>; + + // setup bench harness + cuasr::bench::device::BenchHarness bench({ N, N, N }); + + // benchmark loop + for (auto _ : state) { + benchmark::DoNotOptimize(bench.run()); + cudaDeviceSynchronize(); + } + + double flops_per_itr = 2.0 * N * N * N; + state.counters["Flop/s"] + = benchmark::Counter(flops_per_itr, benchmark::Counter::kIsIterationInvariantRate); +} +BENCHMARK(BM_SM50_device_maximum_multiplies_ssrgemm_nt_t) + ->RangeMultiplier(2)->Range(256, 4096); + +/////////////////////////////////////////////////////////////////////////////// + +static void BM_SM50_device_maximum_multiplies_ssrgemm_nn_n(benchmark::State &state) { + const auto N = static_cast(state.range(0)); + using precision = float; + using OpClass = cutlass::arch::OpClassSimt; + using SmArch = cutlass::arch::Sm50; + + using AddOp = cuasr::maximum; + using MultOp = cuasr::multiplies; + + using Srgemm = cuasr::gemm::device::Srgemm< // + AddOp, MultOp, // + precision, cutlass::layout::ColumnMajor, // + precision, cutlass::layout::ColumnMajor, // + precision, cutlass::layout::ColumnMajor, // + precision, OpClass, SmArch>; + + // setup bench harness + 
cuasr::bench::device::BenchHarness bench({ N, N, N }); + + // benchmark loop + for (auto _ : state) { + benchmark::DoNotOptimize(bench.run()); + cudaDeviceSynchronize(); + } + + double flops_per_itr = 2.0 * N * N * N; + state.counters["Flop/s"] + = benchmark::Counter(flops_per_itr, benchmark::Counter::kIsIterationInvariantRate); +} +BENCHMARK(BM_SM50_device_maximum_multiplies_ssrgemm_nn_n) + ->RangeMultiplier(2)->Range(256, 4096); + +/////////////////////////////////////////////////////////////////////////////// + +static void BM_SM50_device_maximum_multiplies_ssrgemm_nn_t(benchmark::State &state) { + const auto N = static_cast(state.range(0)); + using precision = float; + using OpClass = cutlass::arch::OpClassSimt; + using SmArch = cutlass::arch::Sm50; + + using AddOp = cuasr::maximum; + using MultOp = cuasr::multiplies; + + using Srgemm = cuasr::gemm::device::Srgemm< // + AddOp, MultOp, // + precision, cutlass::layout::ColumnMajor, // + precision, cutlass::layout::ColumnMajor, // + precision, cutlass::layout::RowMajor, // + precision, OpClass, SmArch>; + + // setup bench harness + cuasr::bench::device::BenchHarness bench({ N, N, N }); + + // benchmark loop + for (auto _ : state) { + benchmark::DoNotOptimize(bench.run()); + cudaDeviceSynchronize(); + } + + double flops_per_itr = 2.0 * N * N * N; + state.counters["Flop/s"] + = benchmark::Counter(flops_per_itr, benchmark::Counter::kIsIterationInvariantRate); +} +BENCHMARK(BM_SM50_device_maximum_multiplies_ssrgemm_nn_t) + ->RangeMultiplier(2)->Range(256, 4096); + +/////////////////////////////////////////////////////////////////////////////// + +static void BM_SM50_device_binary_or_binary_and_dsrgemm_tt_n(benchmark::State &state) { + const auto N = static_cast(state.range(0)); + using precision = double; + using OpClass = cutlass::arch::OpClassSimt; + using SmArch = cutlass::arch::Sm50; + + using AddOp = cuasr::binary_or; + using MultOp = cuasr::binary_and; + + using Srgemm = cuasr::gemm::device::Srgemm< // + AddOp, 
MultOp, // + precision, cutlass::layout::RowMajor, // + precision, cutlass::layout::RowMajor, // + precision, cutlass::layout::ColumnMajor, // + precision, OpClass, SmArch>; + + // setup bench harness + cuasr::bench::device::BenchHarness bench({ N, N, N }); + + // benchmark loop + for (auto _ : state) { + benchmark::DoNotOptimize(bench.run()); + cudaDeviceSynchronize(); + } + + double flops_per_itr = 2.0 * N * N * N; + state.counters["Flop/s"] + = benchmark::Counter(flops_per_itr, benchmark::Counter::kIsIterationInvariantRate); +} +BENCHMARK(BM_SM50_device_binary_or_binary_and_dsrgemm_tt_n) + ->RangeMultiplier(2)->Range(256, 4096); + +/////////////////////////////////////////////////////////////////////////////// + +static void BM_SM50_device_binary_or_binary_and_dsrgemm_tt_t(benchmark::State &state) { + const auto N = static_cast(state.range(0)); + using precision = double; + using OpClass = cutlass::arch::OpClassSimt; + using SmArch = cutlass::arch::Sm50; + + using AddOp = cuasr::binary_or; + using MultOp = cuasr::binary_and; + + using Srgemm = cuasr::gemm::device::Srgemm< // + AddOp, MultOp, // + precision, cutlass::layout::RowMajor, // + precision, cutlass::layout::RowMajor, // + precision, cutlass::layout::RowMajor, // + precision, OpClass, SmArch>; + + // setup bench harness + cuasr::bench::device::BenchHarness bench({ N, N, N }); + + // benchmark loop + for (auto _ : state) { + benchmark::DoNotOptimize(bench.run()); + cudaDeviceSynchronize(); + } + + double flops_per_itr = 2.0 * N * N * N; + state.counters["Flop/s"] + = benchmark::Counter(flops_per_itr, benchmark::Counter::kIsIterationInvariantRate); +} +BENCHMARK(BM_SM50_device_binary_or_binary_and_dsrgemm_tt_t) + ->RangeMultiplier(2)->Range(256, 4096); + +/////////////////////////////////////////////////////////////////////////////// + +static void BM_SM50_device_binary_or_binary_and_dsrgemm_tn_n(benchmark::State &state) { + const auto N = static_cast(state.range(0)); + using precision = double; + using 
OpClass = cutlass::arch::OpClassSimt; + using SmArch = cutlass::arch::Sm50; + + using AddOp = cuasr::binary_or; + using MultOp = cuasr::binary_and; + + using Srgemm = cuasr::gemm::device::Srgemm< // + AddOp, MultOp, // + precision, cutlass::layout::RowMajor, // + precision, cutlass::layout::ColumnMajor, // + precision, cutlass::layout::ColumnMajor, // + precision, OpClass, SmArch>; + + // setup bench harness + cuasr::bench::device::BenchHarness bench({ N, N, N }); + + // benchmark loop + for (auto _ : state) { + benchmark::DoNotOptimize(bench.run()); + cudaDeviceSynchronize(); + } + + double flops_per_itr = 2.0 * N * N * N; + state.counters["Flop/s"] + = benchmark::Counter(flops_per_itr, benchmark::Counter::kIsIterationInvariantRate); +} +BENCHMARK(BM_SM50_device_binary_or_binary_and_dsrgemm_tn_n) + ->RangeMultiplier(2)->Range(256, 4096); + +/////////////////////////////////////////////////////////////////////////////// + +static void BM_SM50_device_binary_or_binary_and_dsrgemm_tn_t(benchmark::State &state) { + const auto N = static_cast(state.range(0)); + using precision = double; + using OpClass = cutlass::arch::OpClassSimt; + using SmArch = cutlass::arch::Sm50; + + using AddOp = cuasr::binary_or; + using MultOp = cuasr::binary_and; + + using Srgemm = cuasr::gemm::device::Srgemm< // + AddOp, MultOp, // + precision, cutlass::layout::RowMajor, // + precision, cutlass::layout::ColumnMajor, // + precision, cutlass::layout::RowMajor, // + precision, OpClass, SmArch>; + + // setup bench harness + cuasr::bench::device::BenchHarness bench({ N, N, N }); + + // benchmark loop + for (auto _ : state) { + benchmark::DoNotOptimize(bench.run()); + cudaDeviceSynchronize(); + } + + double flops_per_itr = 2.0 * N * N * N; + state.counters["Flop/s"] + = benchmark::Counter(flops_per_itr, benchmark::Counter::kIsIterationInvariantRate); +} +BENCHMARK(BM_SM50_device_binary_or_binary_and_dsrgemm_tn_t) + ->RangeMultiplier(2)->Range(256, 4096); + 
+/////////////////////////////////////////////////////////////////////////////// + +static void BM_SM50_device_binary_or_binary_and_dsrgemm_nt_n(benchmark::State &state) { + const auto N = static_cast(state.range(0)); + using precision = double; + using OpClass = cutlass::arch::OpClassSimt; + using SmArch = cutlass::arch::Sm50; + + using AddOp = cuasr::binary_or; + using MultOp = cuasr::binary_and; + + using Srgemm = cuasr::gemm::device::Srgemm< // + AddOp, MultOp, // + precision, cutlass::layout::ColumnMajor, // + precision, cutlass::layout::RowMajor, // + precision, cutlass::layout::ColumnMajor, // + precision, OpClass, SmArch>; + + // setup bench harness + cuasr::bench::device::BenchHarness bench({ N, N, N }); + + // benchmark loop + for (auto _ : state) { + benchmark::DoNotOptimize(bench.run()); + cudaDeviceSynchronize(); + } + + double flops_per_itr = 2.0 * N * N * N; + state.counters["Flop/s"] + = benchmark::Counter(flops_per_itr, benchmark::Counter::kIsIterationInvariantRate); +} +BENCHMARK(BM_SM50_device_binary_or_binary_and_dsrgemm_nt_n) + ->RangeMultiplier(2)->Range(256, 4096); + +/////////////////////////////////////////////////////////////////////////////// + +static void BM_SM50_device_binary_or_binary_and_dsrgemm_nt_t(benchmark::State &state) { + const auto N = static_cast(state.range(0)); + using precision = double; + using OpClass = cutlass::arch::OpClassSimt; + using SmArch = cutlass::arch::Sm50; + + using AddOp = cuasr::binary_or; + using MultOp = cuasr::binary_and; + + using Srgemm = cuasr::gemm::device::Srgemm< // + AddOp, MultOp, // + precision, cutlass::layout::ColumnMajor, // + precision, cutlass::layout::RowMajor, // + precision, cutlass::layout::RowMajor, // + precision, OpClass, SmArch>; + + // setup bench harness + cuasr::bench::device::BenchHarness bench({ N, N, N }); + + // benchmark loop + for (auto _ : state) { + benchmark::DoNotOptimize(bench.run()); + cudaDeviceSynchronize(); + } + + double flops_per_itr = 2.0 * N * N * N; + 
state.counters["Flop/s"] + = benchmark::Counter(flops_per_itr, benchmark::Counter::kIsIterationInvariantRate); +} +BENCHMARK(BM_SM50_device_binary_or_binary_and_dsrgemm_nt_t) + ->RangeMultiplier(2)->Range(256, 4096); + +/////////////////////////////////////////////////////////////////////////////// + +static void BM_SM50_device_binary_or_binary_and_dsrgemm_nn_n(benchmark::State &state) { + const auto N = static_cast(state.range(0)); + using precision = double; + using OpClass = cutlass::arch::OpClassSimt; + using SmArch = cutlass::arch::Sm50; + + using AddOp = cuasr::binary_or; + using MultOp = cuasr::binary_and; + + using Srgemm = cuasr::gemm::device::Srgemm< // + AddOp, MultOp, // + precision, cutlass::layout::ColumnMajor, // + precision, cutlass::layout::ColumnMajor, // + precision, cutlass::layout::ColumnMajor, // + precision, OpClass, SmArch>; + + // setup bench harness + cuasr::bench::device::BenchHarness bench({ N, N, N }); + + // benchmark loop + for (auto _ : state) { + benchmark::DoNotOptimize(bench.run()); + cudaDeviceSynchronize(); + } + + double flops_per_itr = 2.0 * N * N * N; + state.counters["Flop/s"] + = benchmark::Counter(flops_per_itr, benchmark::Counter::kIsIterationInvariantRate); +} +BENCHMARK(BM_SM50_device_binary_or_binary_and_dsrgemm_nn_n) + ->RangeMultiplier(2)->Range(256, 4096); + +/////////////////////////////////////////////////////////////////////////////// + +static void BM_SM50_device_binary_or_binary_and_dsrgemm_nn_t(benchmark::State &state) { + const auto N = static_cast(state.range(0)); + using precision = double; + using OpClass = cutlass::arch::OpClassSimt; + using SmArch = cutlass::arch::Sm50; + + using AddOp = cuasr::binary_or; + using MultOp = cuasr::binary_and; + + using Srgemm = cuasr::gemm::device::Srgemm< // + AddOp, MultOp, // + precision, cutlass::layout::ColumnMajor, // + precision, cutlass::layout::ColumnMajor, // + precision, cutlass::layout::RowMajor, // + precision, OpClass, SmArch>; + + // setup bench harness + 
cuasr::bench::device::BenchHarness bench({ N, N, N }); + + // benchmark loop + for (auto _ : state) { + benchmark::DoNotOptimize(bench.run()); + cudaDeviceSynchronize(); + } + + double flops_per_itr = 2.0 * N * N * N; + state.counters["Flop/s"] + = benchmark::Counter(flops_per_itr, benchmark::Counter::kIsIterationInvariantRate); +} +BENCHMARK(BM_SM50_device_binary_or_binary_and_dsrgemm_nn_t) + ->RangeMultiplier(2)->Range(256, 4096); + +/////////////////////////////////////////////////////////////////////////////// + +static void BM_SM50_device_binary_or_binary_and_ssrgemm_tt_n(benchmark::State &state) { + const auto N = static_cast(state.range(0)); + using precision = float; + using OpClass = cutlass::arch::OpClassSimt; + using SmArch = cutlass::arch::Sm50; + + using AddOp = cuasr::binary_or; + using MultOp = cuasr::binary_and; + + using Srgemm = cuasr::gemm::device::Srgemm< // + AddOp, MultOp, // + precision, cutlass::layout::RowMajor, // + precision, cutlass::layout::RowMajor, // + precision, cutlass::layout::ColumnMajor, // + precision, OpClass, SmArch>; + + // setup bench harness + cuasr::bench::device::BenchHarness bench({ N, N, N }); + + // benchmark loop + for (auto _ : state) { + benchmark::DoNotOptimize(bench.run()); + cudaDeviceSynchronize(); + } + + double flops_per_itr = 2.0 * N * N * N; + state.counters["Flop/s"] + = benchmark::Counter(flops_per_itr, benchmark::Counter::kIsIterationInvariantRate); +} +BENCHMARK(BM_SM50_device_binary_or_binary_and_ssrgemm_tt_n) + ->RangeMultiplier(2)->Range(256, 4096); + +/////////////////////////////////////////////////////////////////////////////// + +static void BM_SM50_device_binary_or_binary_and_ssrgemm_tt_t(benchmark::State &state) { + const auto N = static_cast(state.range(0)); + using precision = float; + using OpClass = cutlass::arch::OpClassSimt; + using SmArch = cutlass::arch::Sm50; + + using AddOp = cuasr::binary_or; + using MultOp = cuasr::binary_and; + + using Srgemm = cuasr::gemm::device::Srgemm< // + 
AddOp, MultOp, // + precision, cutlass::layout::RowMajor, // + precision, cutlass::layout::RowMajor, // + precision, cutlass::layout::RowMajor, // + precision, OpClass, SmArch>; + + // setup bench harness + cuasr::bench::device::BenchHarness bench({ N, N, N }); + + // benchmark loop + for (auto _ : state) { + benchmark::DoNotOptimize(bench.run()); + cudaDeviceSynchronize(); + } + + double flops_per_itr = 2.0 * N * N * N; + state.counters["Flop/s"] + = benchmark::Counter(flops_per_itr, benchmark::Counter::kIsIterationInvariantRate); +} +BENCHMARK(BM_SM50_device_binary_or_binary_and_ssrgemm_tt_t) + ->RangeMultiplier(2)->Range(256, 4096); + +/////////////////////////////////////////////////////////////////////////////// + +static void BM_SM50_device_binary_or_binary_and_ssrgemm_tn_n(benchmark::State &state) { + const auto N = static_cast(state.range(0)); + using precision = float; + using OpClass = cutlass::arch::OpClassSimt; + using SmArch = cutlass::arch::Sm50; + + using AddOp = cuasr::binary_or; + using MultOp = cuasr::binary_and; + + using Srgemm = cuasr::gemm::device::Srgemm< // + AddOp, MultOp, // + precision, cutlass::layout::RowMajor, // + precision, cutlass::layout::ColumnMajor, // + precision, cutlass::layout::ColumnMajor, // + precision, OpClass, SmArch>; + + // setup bench harness + cuasr::bench::device::BenchHarness bench({ N, N, N }); + + // benchmark loop + for (auto _ : state) { + benchmark::DoNotOptimize(bench.run()); + cudaDeviceSynchronize(); + } + + double flops_per_itr = 2.0 * N * N * N; + state.counters["Flop/s"] + = benchmark::Counter(flops_per_itr, benchmark::Counter::kIsIterationInvariantRate); +} +BENCHMARK(BM_SM50_device_binary_or_binary_and_ssrgemm_tn_n) + ->RangeMultiplier(2)->Range(256, 4096); + +/////////////////////////////////////////////////////////////////////////////// + +static void BM_SM50_device_binary_or_binary_and_ssrgemm_tn_t(benchmark::State &state) { + const auto N = static_cast(state.range(0)); + using precision = float; + 
using OpClass = cutlass::arch::OpClassSimt; + using SmArch = cutlass::arch::Sm50; + + using AddOp = cuasr::binary_or; + using MultOp = cuasr::binary_and; + + using Srgemm = cuasr::gemm::device::Srgemm< // + AddOp, MultOp, // + precision, cutlass::layout::RowMajor, // + precision, cutlass::layout::ColumnMajor, // + precision, cutlass::layout::RowMajor, // + precision, OpClass, SmArch>; + + // setup bench harness + cuasr::bench::device::BenchHarness bench({ N, N, N }); + + // benchmark loop + for (auto _ : state) { + benchmark::DoNotOptimize(bench.run()); + cudaDeviceSynchronize(); + } + + double flops_per_itr = 2.0 * N * N * N; + state.counters["Flop/s"] + = benchmark::Counter(flops_per_itr, benchmark::Counter::kIsIterationInvariantRate); +} +BENCHMARK(BM_SM50_device_binary_or_binary_and_ssrgemm_tn_t) + ->RangeMultiplier(2)->Range(256, 4096); + +/////////////////////////////////////////////////////////////////////////////// + +static void BM_SM50_device_binary_or_binary_and_ssrgemm_nt_n(benchmark::State &state) { + const auto N = static_cast(state.range(0)); + using precision = float; + using OpClass = cutlass::arch::OpClassSimt; + using SmArch = cutlass::arch::Sm50; + + using AddOp = cuasr::binary_or; + using MultOp = cuasr::binary_and; + + using Srgemm = cuasr::gemm::device::Srgemm< // + AddOp, MultOp, // + precision, cutlass::layout::ColumnMajor, // + precision, cutlass::layout::RowMajor, // + precision, cutlass::layout::ColumnMajor, // + precision, OpClass, SmArch>; + + // setup bench harness + cuasr::bench::device::BenchHarness bench({ N, N, N }); + + // benchmark loop + for (auto _ : state) { + benchmark::DoNotOptimize(bench.run()); + cudaDeviceSynchronize(); + } + + double flops_per_itr = 2.0 * N * N * N; + state.counters["Flop/s"] + = benchmark::Counter(flops_per_itr, benchmark::Counter::kIsIterationInvariantRate); +} +BENCHMARK(BM_SM50_device_binary_or_binary_and_ssrgemm_nt_n) + ->RangeMultiplier(2)->Range(256, 4096); + 
+/////////////////////////////////////////////////////////////////////////////// + +static void BM_SM50_device_binary_or_binary_and_ssrgemm_nt_t(benchmark::State &state) { + const auto N = static_cast(state.range(0)); + using precision = float; + using OpClass = cutlass::arch::OpClassSimt; + using SmArch = cutlass::arch::Sm50; + + using AddOp = cuasr::binary_or; + using MultOp = cuasr::binary_and; + + using Srgemm = cuasr::gemm::device::Srgemm< // + AddOp, MultOp, // + precision, cutlass::layout::ColumnMajor, // + precision, cutlass::layout::RowMajor, // + precision, cutlass::layout::RowMajor, // + precision, OpClass, SmArch>; + + // setup bench harness + cuasr::bench::device::BenchHarness bench({ N, N, N }); + + // benchmark loop + for (auto _ : state) { + benchmark::DoNotOptimize(bench.run()); + cudaDeviceSynchronize(); + } + + double flops_per_itr = 2.0 * N * N * N; + state.counters["Flop/s"] + = benchmark::Counter(flops_per_itr, benchmark::Counter::kIsIterationInvariantRate); +} +BENCHMARK(BM_SM50_device_binary_or_binary_and_ssrgemm_nt_t) + ->RangeMultiplier(2)->Range(256, 4096); + +/////////////////////////////////////////////////////////////////////////////// + +static void BM_SM50_device_binary_or_binary_and_ssrgemm_nn_n(benchmark::State &state) { + const auto N = static_cast(state.range(0)); + using precision = float; + using OpClass = cutlass::arch::OpClassSimt; + using SmArch = cutlass::arch::Sm50; + + using AddOp = cuasr::binary_or; + using MultOp = cuasr::binary_and; + + using Srgemm = cuasr::gemm::device::Srgemm< // + AddOp, MultOp, // + precision, cutlass::layout::ColumnMajor, // + precision, cutlass::layout::ColumnMajor, // + precision, cutlass::layout::ColumnMajor, // + precision, OpClass, SmArch>; + + // setup bench harness + cuasr::bench::device::BenchHarness bench({ N, N, N }); + + // benchmark loop + for (auto _ : state) { + benchmark::DoNotOptimize(bench.run()); + cudaDeviceSynchronize(); + } + + double flops_per_itr = 2.0 * N * N * N; + 
state.counters["Flop/s"] + = benchmark::Counter(flops_per_itr, benchmark::Counter::kIsIterationInvariantRate); +} +BENCHMARK(BM_SM50_device_binary_or_binary_and_ssrgemm_nn_n) + ->RangeMultiplier(2)->Range(256, 4096); + +/////////////////////////////////////////////////////////////////////////////// + +static void BM_SM50_device_binary_or_binary_and_ssrgemm_nn_t(benchmark::State &state) { + const auto N = static_cast(state.range(0)); + using precision = float; + using OpClass = cutlass::arch::OpClassSimt; + using SmArch = cutlass::arch::Sm50; + + using AddOp = cuasr::binary_or; + using MultOp = cuasr::binary_and; + + using Srgemm = cuasr::gemm::device::Srgemm< // + AddOp, MultOp, // + precision, cutlass::layout::ColumnMajor, // + precision, cutlass::layout::ColumnMajor, // + precision, cutlass::layout::RowMajor, // + precision, OpClass, SmArch>; + + // setup bench harness + cuasr::bench::device::BenchHarness bench({ N, N, N }); + + // benchmark loop + for (auto _ : state) { + benchmark::DoNotOptimize(bench.run()); + cudaDeviceSynchronize(); + } + + double flops_per_itr = 2.0 * N * N * N; + state.counters["Flop/s"] + = benchmark::Counter(flops_per_itr, benchmark::Counter::kIsIterationInvariantRate); +} +BENCHMARK(BM_SM50_device_binary_or_binary_and_ssrgemm_nn_t) + ->RangeMultiplier(2)->Range(256, 4096); From 2c6fa5e837f9766175c5a331be0d4f09315776b1 Mon Sep 17 00:00:00 2001 From: Void Date: Mon, 1 Nov 2021 11:47:35 -0400 Subject: [PATCH 08/15] rework DefualtSemiRingConfiguration struct API for clarity --- bench/device/gen_simt.py | 6 +- ..._simt_binary_or_binary_and_dsrgemm_nn_n.cu | 216 +++++------ ..._simt_binary_or_binary_and_dsrgemm_nn_t.cu | 216 +++++------ ..._simt_binary_or_binary_and_dsrgemm_nt_n.cu | 216 +++++------ ..._simt_binary_or_binary_and_dsrgemm_nt_t.cu | 216 +++++------ ..._simt_binary_or_binary_and_dsrgemm_tn_n.cu | 216 +++++------ ..._simt_binary_or_binary_and_dsrgemm_tn_t.cu | 216 +++++------ ..._simt_binary_or_binary_and_dsrgemm_tt_n.cu | 216 
+++++------ ..._simt_binary_or_binary_and_dsrgemm_tt_t.cu | 216 +++++------ ..._simt_binary_or_binary_and_ssrgemm_nn_n.cu | 342 +++++++++--------- ..._simt_binary_or_binary_and_ssrgemm_nn_t.cu | 342 +++++++++--------- ..._simt_binary_or_binary_and_ssrgemm_nt_n.cu | 342 +++++++++--------- ..._simt_binary_or_binary_and_ssrgemm_nt_t.cu | 342 +++++++++--------- ..._simt_binary_or_binary_and_ssrgemm_tn_n.cu | 342 +++++++++--------- ..._simt_binary_or_binary_and_ssrgemm_tn_t.cu | 342 +++++++++--------- ..._simt_binary_or_binary_and_ssrgemm_tt_n.cu | 342 +++++++++--------- ..._simt_binary_or_binary_and_ssrgemm_tt_t.cu | 342 +++++++++--------- .../sm50_simt_maximum_minimum_dsrgemm_nn_n.cu | 216 +++++------ .../sm50_simt_maximum_minimum_dsrgemm_nn_t.cu | 216 +++++------ .../sm50_simt_maximum_minimum_dsrgemm_nt_n.cu | 216 +++++------ .../sm50_simt_maximum_minimum_dsrgemm_nt_t.cu | 216 +++++------ .../sm50_simt_maximum_minimum_dsrgemm_tn_n.cu | 216 +++++------ .../sm50_simt_maximum_minimum_dsrgemm_tn_t.cu | 216 +++++------ .../sm50_simt_maximum_minimum_dsrgemm_tt_n.cu | 216 +++++------ .../sm50_simt_maximum_minimum_dsrgemm_tt_t.cu | 216 +++++------ .../sm50_simt_maximum_minimum_ssrgemm_nn_n.cu | 342 +++++++++--------- .../sm50_simt_maximum_minimum_ssrgemm_nn_t.cu | 342 +++++++++--------- .../sm50_simt_maximum_minimum_ssrgemm_nt_n.cu | 342 +++++++++--------- .../sm50_simt_maximum_minimum_ssrgemm_nt_t.cu | 342 +++++++++--------- .../sm50_simt_maximum_minimum_ssrgemm_tn_n.cu | 342 +++++++++--------- .../sm50_simt_maximum_minimum_ssrgemm_tn_t.cu | 342 +++++++++--------- .../sm50_simt_maximum_minimum_ssrgemm_tt_n.cu | 342 +++++++++--------- .../sm50_simt_maximum_minimum_ssrgemm_tt_t.cu | 342 +++++++++--------- ...50_simt_maximum_multiplies_dsrgemm_nn_n.cu | 216 +++++------ ...50_simt_maximum_multiplies_dsrgemm_nn_t.cu | 216 +++++------ ...50_simt_maximum_multiplies_dsrgemm_nt_n.cu | 216 +++++------ ...50_simt_maximum_multiplies_dsrgemm_nt_t.cu | 216 +++++------ 
...50_simt_maximum_multiplies_dsrgemm_tn_n.cu | 216 +++++------ ...50_simt_maximum_multiplies_dsrgemm_tn_t.cu | 216 +++++------ ...50_simt_maximum_multiplies_dsrgemm_tt_n.cu | 216 +++++------ ...50_simt_maximum_multiplies_dsrgemm_tt_t.cu | 216 +++++------ ...50_simt_maximum_multiplies_ssrgemm_nn_n.cu | 342 +++++++++--------- ...50_simt_maximum_multiplies_ssrgemm_nn_t.cu | 342 +++++++++--------- ...50_simt_maximum_multiplies_ssrgemm_nt_n.cu | 342 +++++++++--------- ...50_simt_maximum_multiplies_ssrgemm_nt_t.cu | 342 +++++++++--------- ...50_simt_maximum_multiplies_ssrgemm_tn_n.cu | 342 +++++++++--------- ...50_simt_maximum_multiplies_ssrgemm_tn_t.cu | 342 +++++++++--------- ...50_simt_maximum_multiplies_ssrgemm_tt_n.cu | 342 +++++++++--------- ...50_simt_maximum_multiplies_ssrgemm_tt_t.cu | 342 +++++++++--------- .../sm50_simt_maximum_plus_dsrgemm_nn_n.cu | 216 +++++------ .../sm50_simt_maximum_plus_dsrgemm_nn_t.cu | 216 +++++------ .../sm50_simt_maximum_plus_dsrgemm_nt_n.cu | 216 +++++------ .../sm50_simt_maximum_plus_dsrgemm_nt_t.cu | 216 +++++------ .../sm50_simt_maximum_plus_dsrgemm_tn_n.cu | 216 +++++------ .../sm50_simt_maximum_plus_dsrgemm_tn_t.cu | 216 +++++------ .../sm50_simt_maximum_plus_dsrgemm_tt_n.cu | 216 +++++------ .../sm50_simt_maximum_plus_dsrgemm_tt_t.cu | 216 +++++------ .../sm50_simt_maximum_plus_ssrgemm_nn_n.cu | 342 +++++++++--------- .../sm50_simt_maximum_plus_ssrgemm_nn_t.cu | 342 +++++++++--------- .../sm50_simt_maximum_plus_ssrgemm_nt_n.cu | 342 +++++++++--------- .../sm50_simt_maximum_plus_ssrgemm_nt_t.cu | 342 +++++++++--------- .../sm50_simt_maximum_plus_ssrgemm_tn_n.cu | 342 +++++++++--------- .../sm50_simt_maximum_plus_ssrgemm_tn_t.cu | 342 +++++++++--------- .../sm50_simt_maximum_plus_ssrgemm_tt_n.cu | 342 +++++++++--------- .../sm50_simt_maximum_plus_ssrgemm_tt_t.cu | 342 +++++++++--------- .../sm50_simt_minimum_maximum_dsrgemm_nn_n.cu | 216 +++++------ .../sm50_simt_minimum_maximum_dsrgemm_nn_t.cu | 216 +++++------ 
.../sm50_simt_minimum_maximum_dsrgemm_nt_n.cu | 216 +++++------ .../sm50_simt_minimum_maximum_dsrgemm_nt_t.cu | 216 +++++------ .../sm50_simt_minimum_maximum_dsrgemm_tn_n.cu | 216 +++++------ .../sm50_simt_minimum_maximum_dsrgemm_tn_t.cu | 216 +++++------ .../sm50_simt_minimum_maximum_dsrgemm_tt_n.cu | 216 +++++------ .../sm50_simt_minimum_maximum_dsrgemm_tt_t.cu | 216 +++++------ .../sm50_simt_minimum_maximum_ssrgemm_nn_n.cu | 342 +++++++++--------- .../sm50_simt_minimum_maximum_ssrgemm_nn_t.cu | 342 +++++++++--------- .../sm50_simt_minimum_maximum_ssrgemm_nt_n.cu | 342 +++++++++--------- .../sm50_simt_minimum_maximum_ssrgemm_nt_t.cu | 342 +++++++++--------- .../sm50_simt_minimum_maximum_ssrgemm_tn_n.cu | 342 +++++++++--------- .../sm50_simt_minimum_maximum_ssrgemm_tn_t.cu | 342 +++++++++--------- .../sm50_simt_minimum_maximum_ssrgemm_tt_n.cu | 342 +++++++++--------- .../sm50_simt_minimum_maximum_ssrgemm_tt_t.cu | 342 +++++++++--------- ...50_simt_minimum_multiplies_dsrgemm_nn_n.cu | 216 +++++------ ...50_simt_minimum_multiplies_dsrgemm_nn_t.cu | 216 +++++------ ...50_simt_minimum_multiplies_dsrgemm_nt_n.cu | 216 +++++------ ...50_simt_minimum_multiplies_dsrgemm_nt_t.cu | 216 +++++------ ...50_simt_minimum_multiplies_dsrgemm_tn_n.cu | 216 +++++------ ...50_simt_minimum_multiplies_dsrgemm_tn_t.cu | 216 +++++------ ...50_simt_minimum_multiplies_dsrgemm_tt_n.cu | 216 +++++------ ...50_simt_minimum_multiplies_dsrgemm_tt_t.cu | 216 +++++------ ...50_simt_minimum_multiplies_ssrgemm_nn_n.cu | 342 +++++++++--------- ...50_simt_minimum_multiplies_ssrgemm_nn_t.cu | 342 +++++++++--------- ...50_simt_minimum_multiplies_ssrgemm_nt_n.cu | 342 +++++++++--------- ...50_simt_minimum_multiplies_ssrgemm_nt_t.cu | 342 +++++++++--------- ...50_simt_minimum_multiplies_ssrgemm_tn_n.cu | 342 +++++++++--------- ...50_simt_minimum_multiplies_ssrgemm_tn_t.cu | 342 +++++++++--------- ...50_simt_minimum_multiplies_ssrgemm_tt_n.cu | 342 +++++++++--------- 
...50_simt_minimum_multiplies_ssrgemm_tt_t.cu | 342 +++++++++--------- .../sm50_simt_minimum_plus_dsrgemm_nn_n.cu | 216 +++++------ .../sm50_simt_minimum_plus_dsrgemm_nn_t.cu | 216 +++++------ .../sm50_simt_minimum_plus_dsrgemm_nt_n.cu | 216 +++++------ .../sm50_simt_minimum_plus_dsrgemm_nt_t.cu | 216 +++++------ .../sm50_simt_minimum_plus_dsrgemm_tn_n.cu | 216 +++++------ .../sm50_simt_minimum_plus_dsrgemm_tn_t.cu | 216 +++++------ .../sm50_simt_minimum_plus_dsrgemm_tt_n.cu | 216 +++++------ .../sm50_simt_minimum_plus_dsrgemm_tt_t.cu | 216 +++++------ .../sm50_simt_minimum_plus_ssrgemm_nn_n.cu | 342 +++++++++--------- .../sm50_simt_minimum_plus_ssrgemm_nn_t.cu | 342 +++++++++--------- .../sm50_simt_minimum_plus_ssrgemm_nt_n.cu | 342 +++++++++--------- .../sm50_simt_minimum_plus_ssrgemm_nt_t.cu | 342 +++++++++--------- .../sm50_simt_minimum_plus_ssrgemm_tn_n.cu | 342 +++++++++--------- .../sm50_simt_minimum_plus_ssrgemm_tn_t.cu | 342 +++++++++--------- .../sm50_simt_minimum_plus_ssrgemm_tt_n.cu | 342 +++++++++--------- .../sm50_simt_minimum_plus_ssrgemm_tt_t.cu | 342 +++++++++--------- .../sm50_simt_plus_multiplies_dsrgemm_nn_n.cu | 216 +++++------ .../sm50_simt_plus_multiplies_dsrgemm_nn_t.cu | 216 +++++------ .../sm50_simt_plus_multiplies_dsrgemm_nt_n.cu | 216 +++++------ .../sm50_simt_plus_multiplies_dsrgemm_nt_t.cu | 216 +++++------ .../sm50_simt_plus_multiplies_dsrgemm_tn_n.cu | 216 +++++------ .../sm50_simt_plus_multiplies_dsrgemm_tn_t.cu | 216 +++++------ .../sm50_simt_plus_multiplies_dsrgemm_tt_n.cu | 216 +++++------ .../sm50_simt_plus_multiplies_dsrgemm_tt_t.cu | 216 +++++------ .../sm50_simt_plus_multiplies_ssrgemm_nn_n.cu | 342 +++++++++--------- .../sm50_simt_plus_multiplies_ssrgemm_nn_t.cu | 342 +++++++++--------- .../sm50_simt_plus_multiplies_ssrgemm_nt_n.cu | 342 +++++++++--------- .../sm50_simt_plus_multiplies_ssrgemm_nt_t.cu | 342 +++++++++--------- .../sm50_simt_plus_multiplies_ssrgemm_tn_n.cu | 342 +++++++++--------- 
.../sm50_simt_plus_multiplies_ssrgemm_tn_t.cu | 342 +++++++++--------- .../sm50_simt_plus_multiplies_ssrgemm_tt_n.cu | 342 +++++++++--------- .../sm50_simt_plus_multiplies_ssrgemm_tt_t.cu | 342 +++++++++--------- .../device/default_srgemm_configuration.h | 23 +- include/cuasr/gemm/device/srgemm.h | 14 +- .../gemm/device/srgemm_splitk_parallel.h | 16 +- test/device/gen_simt.py | 6 +- ..._simt_binary_or_binary_and_dsrgemm_nn_n.cu | 216 +++++------ ..._simt_binary_or_binary_and_dsrgemm_nn_t.cu | 216 +++++------ ..._simt_binary_or_binary_and_dsrgemm_nt_n.cu | 216 +++++------ ..._simt_binary_or_binary_and_dsrgemm_nt_t.cu | 216 +++++------ ..._simt_binary_or_binary_and_dsrgemm_tn_n.cu | 216 +++++------ ..._simt_binary_or_binary_and_dsrgemm_tn_t.cu | 216 +++++------ ..._simt_binary_or_binary_and_dsrgemm_tt_n.cu | 216 +++++------ ..._simt_binary_or_binary_and_dsrgemm_tt_t.cu | 216 +++++------ ..._simt_binary_or_binary_and_ssrgemm_nn_n.cu | 342 +++++++++--------- ..._simt_binary_or_binary_and_ssrgemm_nn_t.cu | 342 +++++++++--------- ..._simt_binary_or_binary_and_ssrgemm_nt_n.cu | 342 +++++++++--------- ..._simt_binary_or_binary_and_ssrgemm_nt_t.cu | 342 +++++++++--------- ..._simt_binary_or_binary_and_ssrgemm_tn_n.cu | 342 +++++++++--------- ..._simt_binary_or_binary_and_ssrgemm_tn_t.cu | 342 +++++++++--------- ..._simt_binary_or_binary_and_ssrgemm_tt_n.cu | 342 +++++++++--------- ..._simt_binary_or_binary_and_ssrgemm_tt_t.cu | 342 +++++++++--------- .../sm50_simt_maximum_minimum_dsrgemm_nn_n.cu | 216 +++++------ .../sm50_simt_maximum_minimum_dsrgemm_nn_t.cu | 216 +++++------ .../sm50_simt_maximum_minimum_dsrgemm_nt_n.cu | 216 +++++------ .../sm50_simt_maximum_minimum_dsrgemm_nt_t.cu | 216 +++++------ .../sm50_simt_maximum_minimum_dsrgemm_tn_n.cu | 216 +++++------ .../sm50_simt_maximum_minimum_dsrgemm_tn_t.cu | 216 +++++------ .../sm50_simt_maximum_minimum_dsrgemm_tt_n.cu | 216 +++++------ .../sm50_simt_maximum_minimum_dsrgemm_tt_t.cu | 216 +++++------ 
.../sm50_simt_maximum_minimum_ssrgemm_nn_n.cu | 342 +++++++++--------- .../sm50_simt_maximum_minimum_ssrgemm_nn_t.cu | 342 +++++++++--------- .../sm50_simt_maximum_minimum_ssrgemm_nt_n.cu | 342 +++++++++--------- .../sm50_simt_maximum_minimum_ssrgemm_nt_t.cu | 342 +++++++++--------- .../sm50_simt_maximum_minimum_ssrgemm_tn_n.cu | 342 +++++++++--------- .../sm50_simt_maximum_minimum_ssrgemm_tn_t.cu | 342 +++++++++--------- .../sm50_simt_maximum_minimum_ssrgemm_tt_n.cu | 342 +++++++++--------- .../sm50_simt_maximum_minimum_ssrgemm_tt_t.cu | 342 +++++++++--------- ...50_simt_maximum_multiplies_dsrgemm_nn_n.cu | 216 +++++------ ...50_simt_maximum_multiplies_dsrgemm_nn_t.cu | 216 +++++------ ...50_simt_maximum_multiplies_dsrgemm_nt_n.cu | 216 +++++------ ...50_simt_maximum_multiplies_dsrgemm_nt_t.cu | 216 +++++------ ...50_simt_maximum_multiplies_dsrgemm_tn_n.cu | 216 +++++------ ...50_simt_maximum_multiplies_dsrgemm_tn_t.cu | 216 +++++------ ...50_simt_maximum_multiplies_dsrgemm_tt_n.cu | 216 +++++------ ...50_simt_maximum_multiplies_dsrgemm_tt_t.cu | 216 +++++------ ...50_simt_maximum_multiplies_ssrgemm_nn_n.cu | 342 +++++++++--------- ...50_simt_maximum_multiplies_ssrgemm_nn_t.cu | 342 +++++++++--------- ...50_simt_maximum_multiplies_ssrgemm_nt_n.cu | 342 +++++++++--------- ...50_simt_maximum_multiplies_ssrgemm_nt_t.cu | 342 +++++++++--------- ...50_simt_maximum_multiplies_ssrgemm_tn_n.cu | 342 +++++++++--------- ...50_simt_maximum_multiplies_ssrgemm_tn_t.cu | 342 +++++++++--------- ...50_simt_maximum_multiplies_ssrgemm_tt_n.cu | 342 +++++++++--------- ...50_simt_maximum_multiplies_ssrgemm_tt_t.cu | 342 +++++++++--------- .../sm50_simt_maximum_plus_dsrgemm_nn_n.cu | 216 +++++------ .../sm50_simt_maximum_plus_dsrgemm_nn_t.cu | 216 +++++------ .../sm50_simt_maximum_plus_dsrgemm_nt_n.cu | 216 +++++------ .../sm50_simt_maximum_plus_dsrgemm_nt_t.cu | 216 +++++------ .../sm50_simt_maximum_plus_dsrgemm_tn_n.cu | 216 +++++------ .../sm50_simt_maximum_plus_dsrgemm_tn_t.cu | 
216 +++++------ .../sm50_simt_maximum_plus_dsrgemm_tt_n.cu | 216 +++++------ .../sm50_simt_maximum_plus_dsrgemm_tt_t.cu | 216 +++++------ .../sm50_simt_maximum_plus_ssrgemm_nn_n.cu | 342 +++++++++--------- .../sm50_simt_maximum_plus_ssrgemm_nn_t.cu | 342 +++++++++--------- .../sm50_simt_maximum_plus_ssrgemm_nt_n.cu | 342 +++++++++--------- .../sm50_simt_maximum_plus_ssrgemm_nt_t.cu | 342 +++++++++--------- .../sm50_simt_maximum_plus_ssrgemm_tn_n.cu | 342 +++++++++--------- .../sm50_simt_maximum_plus_ssrgemm_tn_t.cu | 342 +++++++++--------- .../sm50_simt_maximum_plus_ssrgemm_tt_n.cu | 342 +++++++++--------- .../sm50_simt_maximum_plus_ssrgemm_tt_t.cu | 342 +++++++++--------- .../sm50_simt_minimum_maximum_dsrgemm_nn_n.cu | 216 +++++------ .../sm50_simt_minimum_maximum_dsrgemm_nn_t.cu | 216 +++++------ .../sm50_simt_minimum_maximum_dsrgemm_nt_n.cu | 216 +++++------ .../sm50_simt_minimum_maximum_dsrgemm_nt_t.cu | 216 +++++------ .../sm50_simt_minimum_maximum_dsrgemm_tn_n.cu | 216 +++++------ .../sm50_simt_minimum_maximum_dsrgemm_tn_t.cu | 216 +++++------ .../sm50_simt_minimum_maximum_dsrgemm_tt_n.cu | 216 +++++------ .../sm50_simt_minimum_maximum_dsrgemm_tt_t.cu | 216 +++++------ .../sm50_simt_minimum_maximum_ssrgemm_nn_n.cu | 342 +++++++++--------- .../sm50_simt_minimum_maximum_ssrgemm_nn_t.cu | 342 +++++++++--------- .../sm50_simt_minimum_maximum_ssrgemm_nt_n.cu | 342 +++++++++--------- .../sm50_simt_minimum_maximum_ssrgemm_nt_t.cu | 342 +++++++++--------- .../sm50_simt_minimum_maximum_ssrgemm_tn_n.cu | 342 +++++++++--------- .../sm50_simt_minimum_maximum_ssrgemm_tn_t.cu | 342 +++++++++--------- .../sm50_simt_minimum_maximum_ssrgemm_tt_n.cu | 342 +++++++++--------- .../sm50_simt_minimum_maximum_ssrgemm_tt_t.cu | 342 +++++++++--------- ...50_simt_minimum_multiplies_dsrgemm_nn_n.cu | 216 +++++------ ...50_simt_minimum_multiplies_dsrgemm_nn_t.cu | 216 +++++------ ...50_simt_minimum_multiplies_dsrgemm_nt_n.cu | 216 +++++------ ...50_simt_minimum_multiplies_dsrgemm_nt_t.cu 
| 216 +++++------ ...50_simt_minimum_multiplies_dsrgemm_tn_n.cu | 216 +++++------ ...50_simt_minimum_multiplies_dsrgemm_tn_t.cu | 216 +++++------ ...50_simt_minimum_multiplies_dsrgemm_tt_n.cu | 216 +++++------ ...50_simt_minimum_multiplies_dsrgemm_tt_t.cu | 216 +++++------ ...50_simt_minimum_multiplies_ssrgemm_nn_n.cu | 342 +++++++++--------- ...50_simt_minimum_multiplies_ssrgemm_nn_t.cu | 342 +++++++++--------- ...50_simt_minimum_multiplies_ssrgemm_nt_n.cu | 342 +++++++++--------- ...50_simt_minimum_multiplies_ssrgemm_nt_t.cu | 342 +++++++++--------- ...50_simt_minimum_multiplies_ssrgemm_tn_n.cu | 342 +++++++++--------- ...50_simt_minimum_multiplies_ssrgemm_tn_t.cu | 342 +++++++++--------- ...50_simt_minimum_multiplies_ssrgemm_tt_n.cu | 342 +++++++++--------- ...50_simt_minimum_multiplies_ssrgemm_tt_t.cu | 342 +++++++++--------- .../sm50_simt_minimum_plus_dsrgemm_nn_n.cu | 216 +++++------ .../sm50_simt_minimum_plus_dsrgemm_nn_t.cu | 216 +++++------ .../sm50_simt_minimum_plus_dsrgemm_nt_n.cu | 216 +++++------ .../sm50_simt_minimum_plus_dsrgemm_nt_t.cu | 216 +++++------ .../sm50_simt_minimum_plus_dsrgemm_tn_n.cu | 216 +++++------ .../sm50_simt_minimum_plus_dsrgemm_tn_t.cu | 216 +++++------ .../sm50_simt_minimum_plus_dsrgemm_tt_n.cu | 216 +++++------ .../sm50_simt_minimum_plus_dsrgemm_tt_t.cu | 216 +++++------ .../sm50_simt_minimum_plus_ssrgemm_nn_n.cu | 342 +++++++++--------- .../sm50_simt_minimum_plus_ssrgemm_nn_t.cu | 342 +++++++++--------- .../sm50_simt_minimum_plus_ssrgemm_nt_n.cu | 342 +++++++++--------- .../sm50_simt_minimum_plus_ssrgemm_nt_t.cu | 342 +++++++++--------- .../sm50_simt_minimum_plus_ssrgemm_tn_n.cu | 342 +++++++++--------- .../sm50_simt_minimum_plus_ssrgemm_tn_t.cu | 342 +++++++++--------- .../sm50_simt_minimum_plus_ssrgemm_tt_n.cu | 342 +++++++++--------- .../sm50_simt_minimum_plus_ssrgemm_tt_t.cu | 342 +++++++++--------- .../sm50_simt_plus_multiplies_dsrgemm_nn_n.cu | 216 +++++------ .../sm50_simt_plus_multiplies_dsrgemm_nn_t.cu | 216 
+++++------ .../sm50_simt_plus_multiplies_dsrgemm_nt_n.cu | 216 +++++------ .../sm50_simt_plus_multiplies_dsrgemm_nt_t.cu | 216 +++++------ .../sm50_simt_plus_multiplies_dsrgemm_tn_n.cu | 216 +++++------ .../sm50_simt_plus_multiplies_dsrgemm_tn_t.cu | 216 +++++------ .../sm50_simt_plus_multiplies_dsrgemm_tt_n.cu | 216 +++++------ .../sm50_simt_plus_multiplies_dsrgemm_tt_t.cu | 216 +++++------ .../sm50_simt_plus_multiplies_ssrgemm_nn_n.cu | 342 +++++++++--------- .../sm50_simt_plus_multiplies_ssrgemm_nn_t.cu | 342 +++++++++--------- .../sm50_simt_plus_multiplies_ssrgemm_nt_n.cu | 342 +++++++++--------- .../sm50_simt_plus_multiplies_ssrgemm_nt_t.cu | 342 +++++++++--------- .../sm50_simt_plus_multiplies_ssrgemm_tn_n.cu | 342 +++++++++--------- .../sm50_simt_plus_multiplies_ssrgemm_tn_t.cu | 342 +++++++++--------- .../sm50_simt_plus_multiplies_ssrgemm_tt_n.cu | 342 +++++++++--------- .../sm50_simt_plus_multiplies_ssrgemm_tt_t.cu | 342 +++++++++--------- test/regress/src/cutlass_srgemm.cu | 4 +- 262 files changed, 35749 insertions(+), 35744 deletions(-) diff --git a/bench/device/gen_simt.py b/bench/device/gen_simt.py index 6e884c8..7c2b466 100644 --- a/bench/device/gen_simt.py +++ b/bench/device/gen_simt.py @@ -95,9 +95,9 @@ using WarpShape = cutlass::gemm::GemmShape<{13}, {14}, {12}>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::{0}, cuasr::{1}, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::{0}, cuasr::{1}, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; diff --git a/bench/device/sm50_simt_binary_or_binary_and_dsrgemm_nn_n.cu b/bench/device/sm50_simt_binary_or_binary_and_dsrgemm_nn_n.cu index 1573e38..37efb49 100644 --- 
a/bench/device/sm50_simt_binary_or_binary_and_dsrgemm_nn_n.cu +++ b/bench/device/sm50_simt_binary_or_binary_and_dsrgemm_nn_n.cu @@ -29,9 +29,9 @@ static void BM_SM50_device_binary_or_binary_and_dsrgemm_nn_n_8x32x8_8x32x1_2x4_4 using WarpShape = cutlass::gemm::GemmShape<8, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -79,9 +79,9 @@ static void BM_SM50_device_binary_or_binary_and_dsrgemm_nn_n_16x32x8_16x32x1_4x4 using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -129,9 +129,9 @@ static void BM_SM50_device_binary_or_binary_and_dsrgemm_nn_n_16x64x8_16x64x1_4x8 using WarpShape = cutlass::gemm::GemmShape<16, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, 
cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -179,9 +179,9 @@ static void BM_SM50_device_binary_or_binary_and_dsrgemm_nn_n_32x32x8_32x32x1_8x4 using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -229,9 +229,9 @@ static void BM_SM50_device_binary_or_binary_and_dsrgemm_nn_n_8x32x8_8x16x1_2x2_4 using WarpShape = cutlass::gemm::GemmShape<8, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -279,9 +279,9 @@ static void BM_SM50_device_binary_or_binary_and_dsrgemm_nn_n_8x64x8_8x32x1_2x4_4 using WarpShape = cutlass::gemm::GemmShape<8, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, 
SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -329,9 +329,9 @@ static void BM_SM50_device_binary_or_binary_and_dsrgemm_nn_n_16x32x8_16x16x1_4x2 using WarpShape = cutlass::gemm::GemmShape<16, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -379,9 +379,9 @@ static void BM_SM50_device_binary_or_binary_and_dsrgemm_nn_n_16x64x8_16x32x1_4x4 using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -429,9 +429,9 @@ static void BM_SM50_device_binary_or_binary_and_dsrgemm_nn_n_16x128x8_16x64x1_4x using WarpShape = cutlass::gemm::GemmShape<16, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = 
Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -479,9 +479,9 @@ static void BM_SM50_device_binary_or_binary_and_dsrgemm_nn_n_32x32x8_32x16x1_4x4 using WarpShape = cutlass::gemm::GemmShape<32, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -529,9 +529,9 @@ static void BM_SM50_device_binary_or_binary_and_dsrgemm_nn_n_32x64x8_32x32x1_8x4 using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -579,9 +579,9 @@ static void BM_SM50_device_binary_or_binary_and_dsrgemm_nn_n_32x32x8_16x32x1_4x4 using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using 
MultOp = Config::MultiplicationOp; @@ -629,9 +629,9 @@ static void BM_SM50_device_binary_or_binary_and_dsrgemm_nn_n_64x32x8_32x32x1_8x4 using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -679,9 +679,9 @@ static void BM_SM50_device_binary_or_binary_and_dsrgemm_nn_n_16x32x8_8x16x1_2x2_ using WarpShape = cutlass::gemm::GemmShape<8, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -729,9 +729,9 @@ static void BM_SM50_device_binary_or_binary_and_dsrgemm_nn_n_16x64x8_8x32x1_2x4_ using WarpShape = cutlass::gemm::GemmShape<8, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = 
Config::MultiplicationOp; @@ -779,9 +779,9 @@ static void BM_SM50_device_binary_or_binary_and_dsrgemm_nn_n_32x32x8_16x16x1_4x2 using WarpShape = cutlass::gemm::GemmShape<16, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -829,9 +829,9 @@ static void BM_SM50_device_binary_or_binary_and_dsrgemm_nn_n_32x64x8_16x32x1_4x4 using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -879,9 +879,9 @@ static void BM_SM50_device_binary_or_binary_and_dsrgemm_nn_n_32x128x8_16x64x1_4x using WarpShape = cutlass::gemm::GemmShape<16, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ 
-929,9 +929,9 @@ static void BM_SM50_device_binary_or_binary_and_dsrgemm_nn_n_64x32x8_32x16x1_4x4 using WarpShape = cutlass::gemm::GemmShape<32, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -979,9 +979,9 @@ static void BM_SM50_device_binary_or_binary_and_dsrgemm_nn_n_64x64x8_32x32x1_8x4 using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1029,9 +1029,9 @@ static void BM_SM50_device_binary_or_binary_and_dsrgemm_nn_n_128x32x8_64x16x1_8x using WarpShape = cutlass::gemm::GemmShape<64, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1079,9 +1079,9 @@ static 
void BM_SM50_device_binary_or_binary_and_dsrgemm_nn_n_16x64x16_8x16x1_2x2 using WarpShape = cutlass::gemm::GemmShape<8, 16, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1129,9 +1129,9 @@ static void BM_SM50_device_binary_or_binary_and_dsrgemm_nn_n_16x128x16_8x32x1_2x using WarpShape = cutlass::gemm::GemmShape<8, 32, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1179,9 +1179,9 @@ static void BM_SM50_device_binary_or_binary_and_dsrgemm_nn_n_32x32x8_16x8x1_2x2_ using WarpShape = cutlass::gemm::GemmShape<16, 8, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1229,9 +1229,9 @@ static void 
BM_SM50_device_binary_or_binary_and_dsrgemm_nn_n_32x64x8_16x16x1_4x2 using WarpShape = cutlass::gemm::GemmShape<16, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1279,9 +1279,9 @@ static void BM_SM50_device_binary_or_binary_and_dsrgemm_nn_n_32x128x8_16x32x1_4x using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1329,9 +1329,9 @@ static void BM_SM50_device_binary_or_binary_and_dsrgemm_nn_n_64x64x8_32x16x1_4x4 using WarpShape = cutlass::gemm::GemmShape<32, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1379,9 +1379,9 @@ static void 
BM_SM50_device_binary_or_binary_and_dsrgemm_nn_n_32x32x8_8x16x1_2x2_ using WarpShape = cutlass::gemm::GemmShape<8, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1429,9 +1429,9 @@ static void BM_SM50_device_binary_or_binary_and_dsrgemm_nn_n_64x32x8_16x16x1_4x2 using WarpShape = cutlass::gemm::GemmShape<16, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1479,9 +1479,9 @@ static void BM_SM50_device_binary_or_binary_and_dsrgemm_nn_n_64x64x8_16x32x1_4x4 using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1529,9 +1529,9 @@ static void 
BM_SM50_device_binary_or_binary_and_dsrgemm_nn_n_128x32x8_32x16x1_4x using WarpShape = cutlass::gemm::GemmShape<32, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1579,9 +1579,9 @@ static void BM_SM50_device_binary_or_binary_and_dsrgemm_nn_n_32x64x16_8x16x1_2x2 using WarpShape = cutlass::gemm::GemmShape<8, 16, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1629,9 +1629,9 @@ static void BM_SM50_device_binary_or_binary_and_dsrgemm_nn_n_32x128x16_8x32x1_2x using WarpShape = cutlass::gemm::GemmShape<8, 32, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1679,9 +1679,9 @@ static void 
BM_SM50_device_binary_or_binary_and_dsrgemm_nn_n_64x32x16_16x8x1_2x2 using WarpShape = cutlass::gemm::GemmShape<16, 8, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1729,9 +1729,9 @@ static void BM_SM50_device_binary_or_binary_and_dsrgemm_nn_n_64x64x8_16x16x1_4x2 using WarpShape = cutlass::gemm::GemmShape<16, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1779,9 +1779,9 @@ static void BM_SM50_device_binary_or_binary_and_dsrgemm_nn_n_128x32x16_32x8x1_4x using WarpShape = cutlass::gemm::GemmShape<32, 8, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; diff --git 
a/bench/device/sm50_simt_binary_or_binary_and_dsrgemm_nn_t.cu b/bench/device/sm50_simt_binary_or_binary_and_dsrgemm_nn_t.cu index ebf1e47..4c3c1df 100644 --- a/bench/device/sm50_simt_binary_or_binary_and_dsrgemm_nn_t.cu +++ b/bench/device/sm50_simt_binary_or_binary_and_dsrgemm_nn_t.cu @@ -29,9 +29,9 @@ static void BM_SM50_device_binary_or_binary_and_dsrgemm_nn_t_8x32x8_8x32x1_2x4_4 using WarpShape = cutlass::gemm::GemmShape<8, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -79,9 +79,9 @@ static void BM_SM50_device_binary_or_binary_and_dsrgemm_nn_t_16x32x8_16x32x1_4x4 using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -129,9 +129,9 @@ static void BM_SM50_device_binary_or_binary_and_dsrgemm_nn_t_16x64x8_16x64x1_4x8 using WarpShape = cutlass::gemm::GemmShape<16, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + 
using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -179,9 +179,9 @@ static void BM_SM50_device_binary_or_binary_and_dsrgemm_nn_t_32x32x8_32x32x1_8x4 using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -229,9 +229,9 @@ static void BM_SM50_device_binary_or_binary_and_dsrgemm_nn_t_8x32x8_8x16x1_2x2_4 using WarpShape = cutlass::gemm::GemmShape<8, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -279,9 +279,9 @@ static void BM_SM50_device_binary_or_binary_and_dsrgemm_nn_t_8x64x8_8x32x1_2x4_4 using WarpShape = cutlass::gemm::GemmShape<8, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename 
cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -329,9 +329,9 @@ static void BM_SM50_device_binary_or_binary_and_dsrgemm_nn_t_16x32x8_16x16x1_4x2 using WarpShape = cutlass::gemm::GemmShape<16, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -379,9 +379,9 @@ static void BM_SM50_device_binary_or_binary_and_dsrgemm_nn_t_16x64x8_16x32x1_4x4 using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -429,9 +429,9 @@ static void BM_SM50_device_binary_or_binary_and_dsrgemm_nn_t_16x128x8_16x64x1_4x using WarpShape = cutlass::gemm::GemmShape<16, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename 
cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -479,9 +479,9 @@ static void BM_SM50_device_binary_or_binary_and_dsrgemm_nn_t_32x32x8_32x16x1_4x4 using WarpShape = cutlass::gemm::GemmShape<32, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -529,9 +529,9 @@ static void BM_SM50_device_binary_or_binary_and_dsrgemm_nn_t_32x64x8_32x32x1_8x4 using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -579,9 +579,9 @@ static void BM_SM50_device_binary_or_binary_and_dsrgemm_nn_t_32x32x8_16x32x1_4x4 using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename 
cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -629,9 +629,9 @@ static void BM_SM50_device_binary_or_binary_and_dsrgemm_nn_t_64x32x8_32x32x1_8x4 using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -679,9 +679,9 @@ static void BM_SM50_device_binary_or_binary_and_dsrgemm_nn_t_16x32x8_8x16x1_2x2_ using WarpShape = cutlass::gemm::GemmShape<8, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -729,9 +729,9 @@ static void BM_SM50_device_binary_or_binary_and_dsrgemm_nn_t_16x64x8_8x32x1_2x4_ using WarpShape = cutlass::gemm::GemmShape<8, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename 
cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -779,9 +779,9 @@ static void BM_SM50_device_binary_or_binary_and_dsrgemm_nn_t_32x32x8_16x16x1_4x2 using WarpShape = cutlass::gemm::GemmShape<16, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -829,9 +829,9 @@ static void BM_SM50_device_binary_or_binary_and_dsrgemm_nn_t_32x64x8_16x32x1_4x4 using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -879,9 +879,9 @@ static void BM_SM50_device_binary_or_binary_and_dsrgemm_nn_t_32x128x8_16x64x1_4x using WarpShape = cutlass::gemm::GemmShape<16, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename 
cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -929,9 +929,9 @@ static void BM_SM50_device_binary_or_binary_and_dsrgemm_nn_t_64x32x8_32x16x1_4x4 using WarpShape = cutlass::gemm::GemmShape<32, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -979,9 +979,9 @@ static void BM_SM50_device_binary_or_binary_and_dsrgemm_nn_t_64x64x8_32x32x1_8x4 using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1029,9 +1029,9 @@ static void BM_SM50_device_binary_or_binary_and_dsrgemm_nn_t_128x32x8_64x16x1_8x using WarpShape = cutlass::gemm::GemmShape<64, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename 
cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1079,9 +1079,9 @@ static void BM_SM50_device_binary_or_binary_and_dsrgemm_nn_t_16x64x16_8x16x1_2x2 using WarpShape = cutlass::gemm::GemmShape<8, 16, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1129,9 +1129,9 @@ static void BM_SM50_device_binary_or_binary_and_dsrgemm_nn_t_16x128x16_8x32x1_2x using WarpShape = cutlass::gemm::GemmShape<8, 32, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1179,9 +1179,9 @@ static void BM_SM50_device_binary_or_binary_and_dsrgemm_nn_t_32x32x8_16x8x1_2x2_ using WarpShape = cutlass::gemm::GemmShape<16, 8, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename 
cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1229,9 +1229,9 @@ static void BM_SM50_device_binary_or_binary_and_dsrgemm_nn_t_32x64x8_16x16x1_4x2 using WarpShape = cutlass::gemm::GemmShape<16, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1279,9 +1279,9 @@ static void BM_SM50_device_binary_or_binary_and_dsrgemm_nn_t_32x128x8_16x32x1_4x using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1329,9 +1329,9 @@ static void BM_SM50_device_binary_or_binary_and_dsrgemm_nn_t_64x64x8_32x16x1_4x4 using WarpShape = cutlass::gemm::GemmShape<32, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename 
cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1379,9 +1379,9 @@ static void BM_SM50_device_binary_or_binary_and_dsrgemm_nn_t_32x32x8_8x16x1_2x2_ using WarpShape = cutlass::gemm::GemmShape<8, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1429,9 +1429,9 @@ static void BM_SM50_device_binary_or_binary_and_dsrgemm_nn_t_64x32x8_16x16x1_4x2 using WarpShape = cutlass::gemm::GemmShape<16, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1479,9 +1479,9 @@ static void BM_SM50_device_binary_or_binary_and_dsrgemm_nn_t_64x64x8_16x32x1_4x4 using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename 
cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1529,9 +1529,9 @@ static void BM_SM50_device_binary_or_binary_and_dsrgemm_nn_t_128x32x8_32x16x1_4x using WarpShape = cutlass::gemm::GemmShape<32, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1579,9 +1579,9 @@ static void BM_SM50_device_binary_or_binary_and_dsrgemm_nn_t_32x64x16_8x16x1_2x2 using WarpShape = cutlass::gemm::GemmShape<8, 16, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1629,9 +1629,9 @@ static void BM_SM50_device_binary_or_binary_and_dsrgemm_nn_t_32x128x16_8x32x1_2x using WarpShape = cutlass::gemm::GemmShape<8, 32, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename 
cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1679,9 +1679,9 @@ static void BM_SM50_device_binary_or_binary_and_dsrgemm_nn_t_64x32x16_16x8x1_2x2 using WarpShape = cutlass::gemm::GemmShape<16, 8, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1729,9 +1729,9 @@ static void BM_SM50_device_binary_or_binary_and_dsrgemm_nn_t_64x64x8_16x16x1_4x2 using WarpShape = cutlass::gemm::GemmShape<16, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1779,9 +1779,9 @@ static void BM_SM50_device_binary_or_binary_and_dsrgemm_nn_t_128x32x16_32x8x1_4x using WarpShape = cutlass::gemm::GemmShape<32, 8, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename 
cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; diff --git a/bench/device/sm50_simt_binary_or_binary_and_dsrgemm_nt_n.cu b/bench/device/sm50_simt_binary_or_binary_and_dsrgemm_nt_n.cu index 22f4653..cc02061 100644 --- a/bench/device/sm50_simt_binary_or_binary_and_dsrgemm_nt_n.cu +++ b/bench/device/sm50_simt_binary_or_binary_and_dsrgemm_nt_n.cu @@ -29,9 +29,9 @@ static void BM_SM50_device_binary_or_binary_and_dsrgemm_nt_n_8x32x8_8x32x1_2x4_4 using WarpShape = cutlass::gemm::GemmShape<8, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -79,9 +79,9 @@ static void BM_SM50_device_binary_or_binary_and_dsrgemm_nt_n_16x32x8_16x32x1_4x4 using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -129,9 +129,9 @@ static void BM_SM50_device_binary_or_binary_and_dsrgemm_nt_n_16x64x8_16x64x1_4x8 using WarpShape = cutlass::gemm::GemmShape<16, 64, 8>; using 
InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -179,9 +179,9 @@ static void BM_SM50_device_binary_or_binary_and_dsrgemm_nt_n_32x32x8_32x32x1_8x4 using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -229,9 +229,9 @@ static void BM_SM50_device_binary_or_binary_and_dsrgemm_nt_n_8x32x8_8x16x1_2x2_4 using WarpShape = cutlass::gemm::GemmShape<8, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -279,9 +279,9 @@ static void BM_SM50_device_binary_or_binary_and_dsrgemm_nt_n_8x64x8_8x32x1_2x4_4 using WarpShape = cutlass::gemm::GemmShape<8, 32, 8>; using InstructionShape = 
cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -329,9 +329,9 @@ static void BM_SM50_device_binary_or_binary_and_dsrgemm_nt_n_16x32x8_16x16x1_4x2 using WarpShape = cutlass::gemm::GemmShape<16, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -379,9 +379,9 @@ static void BM_SM50_device_binary_or_binary_and_dsrgemm_nt_n_16x64x8_16x32x1_4x4 using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -429,9 +429,9 @@ static void BM_SM50_device_binary_or_binary_and_dsrgemm_nt_n_16x128x8_16x64x1_4x using WarpShape = cutlass::gemm::GemmShape<16, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 
1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -479,9 +479,9 @@ static void BM_SM50_device_binary_or_binary_and_dsrgemm_nt_n_32x32x8_32x16x1_4x4 using WarpShape = cutlass::gemm::GemmShape<32, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -529,9 +529,9 @@ static void BM_SM50_device_binary_or_binary_and_dsrgemm_nt_n_32x64x8_32x32x1_8x4 using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -579,9 +579,9 @@ static void BM_SM50_device_binary_or_binary_and_dsrgemm_nt_n_32x32x8_16x32x1_4x4 using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = 
typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -629,9 +629,9 @@ static void BM_SM50_device_binary_or_binary_and_dsrgemm_nt_n_64x32x8_32x32x1_8x4 using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -679,9 +679,9 @@ static void BM_SM50_device_binary_or_binary_and_dsrgemm_nt_n_16x32x8_8x16x1_2x2_ using WarpShape = cutlass::gemm::GemmShape<8, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -729,9 +729,9 @@ static void BM_SM50_device_binary_or_binary_and_dsrgemm_nt_n_16x64x8_8x32x1_2x4_ using WarpShape = cutlass::gemm::GemmShape<8, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename 
cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -779,9 +779,9 @@ static void BM_SM50_device_binary_or_binary_and_dsrgemm_nt_n_32x32x8_16x16x1_4x2 using WarpShape = cutlass::gemm::GemmShape<16, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -829,9 +829,9 @@ static void BM_SM50_device_binary_or_binary_and_dsrgemm_nt_n_32x64x8_16x32x1_4x4 using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -879,9 +879,9 @@ static void BM_SM50_device_binary_or_binary_and_dsrgemm_nt_n_32x128x8_16x64x1_4x using WarpShape = cutlass::gemm::GemmShape<16, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename 
cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -929,9 +929,9 @@ static void BM_SM50_device_binary_or_binary_and_dsrgemm_nt_n_64x32x8_32x16x1_4x4 using WarpShape = cutlass::gemm::GemmShape<32, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -979,9 +979,9 @@ static void BM_SM50_device_binary_or_binary_and_dsrgemm_nt_n_64x64x8_32x32x1_8x4 using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1029,9 +1029,9 @@ static void BM_SM50_device_binary_or_binary_and_dsrgemm_nt_n_128x32x8_64x16x1_8x using WarpShape = cutlass::gemm::GemmShape<64, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename 
cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1079,9 +1079,9 @@ static void BM_SM50_device_binary_or_binary_and_dsrgemm_nt_n_16x64x16_8x16x1_2x2 using WarpShape = cutlass::gemm::GemmShape<8, 16, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1129,9 +1129,9 @@ static void BM_SM50_device_binary_or_binary_and_dsrgemm_nt_n_16x128x16_8x32x1_2x using WarpShape = cutlass::gemm::GemmShape<8, 32, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1179,9 +1179,9 @@ static void BM_SM50_device_binary_or_binary_and_dsrgemm_nt_n_32x32x8_16x8x1_2x2_ using WarpShape = cutlass::gemm::GemmShape<16, 8, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename 
cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1229,9 +1229,9 @@ static void BM_SM50_device_binary_or_binary_and_dsrgemm_nt_n_32x64x8_16x16x1_4x2 using WarpShape = cutlass::gemm::GemmShape<16, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1279,9 +1279,9 @@ static void BM_SM50_device_binary_or_binary_and_dsrgemm_nt_n_32x128x8_16x32x1_4x using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1329,9 +1329,9 @@ static void BM_SM50_device_binary_or_binary_and_dsrgemm_nt_n_64x64x8_32x16x1_4x4 using WarpShape = cutlass::gemm::GemmShape<32, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename 
cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1379,9 +1379,9 @@ static void BM_SM50_device_binary_or_binary_and_dsrgemm_nt_n_32x32x8_8x16x1_2x2_ using WarpShape = cutlass::gemm::GemmShape<8, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1429,9 +1429,9 @@ static void BM_SM50_device_binary_or_binary_and_dsrgemm_nt_n_64x32x8_16x16x1_4x2 using WarpShape = cutlass::gemm::GemmShape<16, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1479,9 +1479,9 @@ static void BM_SM50_device_binary_or_binary_and_dsrgemm_nt_n_64x64x8_16x32x1_4x4 using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename 
cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1529,9 +1529,9 @@ static void BM_SM50_device_binary_or_binary_and_dsrgemm_nt_n_128x32x8_32x16x1_4x using WarpShape = cutlass::gemm::GemmShape<32, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1579,9 +1579,9 @@ static void BM_SM50_device_binary_or_binary_and_dsrgemm_nt_n_32x64x16_8x16x1_2x2 using WarpShape = cutlass::gemm::GemmShape<8, 16, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1629,9 +1629,9 @@ static void BM_SM50_device_binary_or_binary_and_dsrgemm_nt_n_32x128x16_8x32x1_2x using WarpShape = cutlass::gemm::GemmShape<8, 32, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename 
cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1679,9 +1679,9 @@ static void BM_SM50_device_binary_or_binary_and_dsrgemm_nt_n_64x32x16_16x8x1_2x2 using WarpShape = cutlass::gemm::GemmShape<16, 8, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1729,9 +1729,9 @@ static void BM_SM50_device_binary_or_binary_and_dsrgemm_nt_n_64x64x8_16x16x1_4x2 using WarpShape = cutlass::gemm::GemmShape<16, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1779,9 +1779,9 @@ static void BM_SM50_device_binary_or_binary_and_dsrgemm_nt_n_128x32x16_32x8x1_4x using WarpShape = cutlass::gemm::GemmShape<32, 8, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename 
cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; diff --git a/bench/device/sm50_simt_binary_or_binary_and_dsrgemm_nt_t.cu b/bench/device/sm50_simt_binary_or_binary_and_dsrgemm_nt_t.cu index b4a6ded..1123169 100644 --- a/bench/device/sm50_simt_binary_or_binary_and_dsrgemm_nt_t.cu +++ b/bench/device/sm50_simt_binary_or_binary_and_dsrgemm_nt_t.cu @@ -29,9 +29,9 @@ static void BM_SM50_device_binary_or_binary_and_dsrgemm_nt_t_8x32x8_8x32x1_2x4_4 using WarpShape = cutlass::gemm::GemmShape<8, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -79,9 +79,9 @@ static void BM_SM50_device_binary_or_binary_and_dsrgemm_nt_t_16x32x8_16x32x1_4x4 using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = 
Config::MultiplicationOp; @@ -129,9 +129,9 @@ static void BM_SM50_device_binary_or_binary_and_dsrgemm_nt_t_16x64x8_16x64x1_4x8 using WarpShape = cutlass::gemm::GemmShape<16, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -179,9 +179,9 @@ static void BM_SM50_device_binary_or_binary_and_dsrgemm_nt_t_32x32x8_32x32x1_8x4 using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -229,9 +229,9 @@ static void BM_SM50_device_binary_or_binary_and_dsrgemm_nt_t_8x32x8_8x16x1_2x2_4 using WarpShape = cutlass::gemm::GemmShape<8, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ 
-279,9 +279,9 @@ static void BM_SM50_device_binary_or_binary_and_dsrgemm_nt_t_8x64x8_8x32x1_2x4_4 using WarpShape = cutlass::gemm::GemmShape<8, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -329,9 +329,9 @@ static void BM_SM50_device_binary_or_binary_and_dsrgemm_nt_t_16x32x8_16x16x1_4x2 using WarpShape = cutlass::gemm::GemmShape<16, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -379,9 +379,9 @@ static void BM_SM50_device_binary_or_binary_and_dsrgemm_nt_t_16x64x8_16x32x1_4x4 using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -429,9 +429,9 @@ static void 
BM_SM50_device_binary_or_binary_and_dsrgemm_nt_t_16x128x8_16x64x1_4x using WarpShape = cutlass::gemm::GemmShape<16, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -479,9 +479,9 @@ static void BM_SM50_device_binary_or_binary_and_dsrgemm_nt_t_32x32x8_32x16x1_4x4 using WarpShape = cutlass::gemm::GemmShape<32, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -529,9 +529,9 @@ static void BM_SM50_device_binary_or_binary_and_dsrgemm_nt_t_32x64x8_32x32x1_8x4 using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -579,9 +579,9 @@ static void 
BM_SM50_device_binary_or_binary_and_dsrgemm_nt_t_32x32x8_16x32x1_4x4 using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -629,9 +629,9 @@ static void BM_SM50_device_binary_or_binary_and_dsrgemm_nt_t_64x32x8_32x32x1_8x4 using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -679,9 +679,9 @@ static void BM_SM50_device_binary_or_binary_and_dsrgemm_nt_t_16x32x8_8x16x1_2x2_ using WarpShape = cutlass::gemm::GemmShape<8, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -729,9 +729,9 @@ static void 
BM_SM50_device_binary_or_binary_and_dsrgemm_nt_t_16x64x8_8x32x1_2x4_ using WarpShape = cutlass::gemm::GemmShape<8, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -779,9 +779,9 @@ static void BM_SM50_device_binary_or_binary_and_dsrgemm_nt_t_32x32x8_16x16x1_4x2 using WarpShape = cutlass::gemm::GemmShape<16, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -829,9 +829,9 @@ static void BM_SM50_device_binary_or_binary_and_dsrgemm_nt_t_32x64x8_16x32x1_4x4 using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -879,9 +879,9 @@ static void 
BM_SM50_device_binary_or_binary_and_dsrgemm_nt_t_32x128x8_16x64x1_4x using WarpShape = cutlass::gemm::GemmShape<16, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -929,9 +929,9 @@ static void BM_SM50_device_binary_or_binary_and_dsrgemm_nt_t_64x32x8_32x16x1_4x4 using WarpShape = cutlass::gemm::GemmShape<32, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -979,9 +979,9 @@ static void BM_SM50_device_binary_or_binary_and_dsrgemm_nt_t_64x64x8_32x32x1_8x4 using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1029,9 +1029,9 @@ static void 
BM_SM50_device_binary_or_binary_and_dsrgemm_nt_t_128x32x8_64x16x1_8x using WarpShape = cutlass::gemm::GemmShape<64, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1079,9 +1079,9 @@ static void BM_SM50_device_binary_or_binary_and_dsrgemm_nt_t_16x64x16_8x16x1_2x2 using WarpShape = cutlass::gemm::GemmShape<8, 16, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1129,9 +1129,9 @@ static void BM_SM50_device_binary_or_binary_and_dsrgemm_nt_t_16x128x16_8x32x1_2x using WarpShape = cutlass::gemm::GemmShape<8, 32, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1179,9 +1179,9 @@ static void 
BM_SM50_device_binary_or_binary_and_dsrgemm_nt_t_32x32x8_16x8x1_2x2_ using WarpShape = cutlass::gemm::GemmShape<16, 8, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1229,9 +1229,9 @@ static void BM_SM50_device_binary_or_binary_and_dsrgemm_nt_t_32x64x8_16x16x1_4x2 using WarpShape = cutlass::gemm::GemmShape<16, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1279,9 +1279,9 @@ static void BM_SM50_device_binary_or_binary_and_dsrgemm_nt_t_32x128x8_16x32x1_4x using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1329,9 +1329,9 @@ static void 
BM_SM50_device_binary_or_binary_and_dsrgemm_nt_t_64x64x8_32x16x1_4x4 using WarpShape = cutlass::gemm::GemmShape<32, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1379,9 +1379,9 @@ static void BM_SM50_device_binary_or_binary_and_dsrgemm_nt_t_32x32x8_8x16x1_2x2_ using WarpShape = cutlass::gemm::GemmShape<8, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1429,9 +1429,9 @@ static void BM_SM50_device_binary_or_binary_and_dsrgemm_nt_t_64x32x8_16x16x1_4x2 using WarpShape = cutlass::gemm::GemmShape<16, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1479,9 +1479,9 @@ static void 
BM_SM50_device_binary_or_binary_and_dsrgemm_nt_t_64x64x8_16x32x1_4x4 using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1529,9 +1529,9 @@ static void BM_SM50_device_binary_or_binary_and_dsrgemm_nt_t_128x32x8_32x16x1_4x using WarpShape = cutlass::gemm::GemmShape<32, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1579,9 +1579,9 @@ static void BM_SM50_device_binary_or_binary_and_dsrgemm_nt_t_32x64x16_8x16x1_2x2 using WarpShape = cutlass::gemm::GemmShape<8, 16, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1629,9 +1629,9 @@ static void 
BM_SM50_device_binary_or_binary_and_dsrgemm_nt_t_32x128x16_8x32x1_2x using WarpShape = cutlass::gemm::GemmShape<8, 32, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1679,9 +1679,9 @@ static void BM_SM50_device_binary_or_binary_and_dsrgemm_nt_t_64x32x16_16x8x1_2x2 using WarpShape = cutlass::gemm::GemmShape<16, 8, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1729,9 +1729,9 @@ static void BM_SM50_device_binary_or_binary_and_dsrgemm_nt_t_64x64x8_16x16x1_4x2 using WarpShape = cutlass::gemm::GemmShape<16, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1779,9 +1779,9 @@ static void 
BM_SM50_device_binary_or_binary_and_dsrgemm_nt_t_128x32x16_32x8x1_4x using WarpShape = cutlass::gemm::GemmShape<32, 8, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; diff --git a/bench/device/sm50_simt_binary_or_binary_and_dsrgemm_tn_n.cu b/bench/device/sm50_simt_binary_or_binary_and_dsrgemm_tn_n.cu index 30bb6b7..fc4d354 100644 --- a/bench/device/sm50_simt_binary_or_binary_and_dsrgemm_tn_n.cu +++ b/bench/device/sm50_simt_binary_or_binary_and_dsrgemm_tn_n.cu @@ -29,9 +29,9 @@ static void BM_SM50_device_binary_or_binary_and_dsrgemm_tn_n_8x32x8_8x32x1_2x4_4 using WarpShape = cutlass::gemm::GemmShape<8, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -79,9 +79,9 @@ static void BM_SM50_device_binary_or_binary_and_dsrgemm_tn_n_16x32x8_16x32x1_4x4 using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = 
typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -129,9 +129,9 @@ static void BM_SM50_device_binary_or_binary_and_dsrgemm_tn_n_16x64x8_16x64x1_4x8 using WarpShape = cutlass::gemm::GemmShape<16, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -179,9 +179,9 @@ static void BM_SM50_device_binary_or_binary_and_dsrgemm_tn_n_32x32x8_32x32x1_8x4 using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -229,9 +229,9 @@ static void BM_SM50_device_binary_or_binary_and_dsrgemm_tn_n_8x32x8_8x16x1_2x2_4 using WarpShape = cutlass::gemm::GemmShape<8, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename 
cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -279,9 +279,9 @@ static void BM_SM50_device_binary_or_binary_and_dsrgemm_tn_n_8x64x8_8x32x1_2x4_4 using WarpShape = cutlass::gemm::GemmShape<8, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -329,9 +329,9 @@ static void BM_SM50_device_binary_or_binary_and_dsrgemm_tn_n_16x32x8_16x16x1_4x2 using WarpShape = cutlass::gemm::GemmShape<16, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -379,9 +379,9 @@ static void BM_SM50_device_binary_or_binary_and_dsrgemm_tn_n_16x64x8_16x32x1_4x4 using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename 
cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -429,9 +429,9 @@ static void BM_SM50_device_binary_or_binary_and_dsrgemm_tn_n_16x128x8_16x64x1_4x using WarpShape = cutlass::gemm::GemmShape<16, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -479,9 +479,9 @@ static void BM_SM50_device_binary_or_binary_and_dsrgemm_tn_n_32x32x8_32x16x1_4x4 using WarpShape = cutlass::gemm::GemmShape<32, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -529,9 +529,9 @@ static void BM_SM50_device_binary_or_binary_and_dsrgemm_tn_n_32x64x8_32x32x1_8x4 using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename 
cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -579,9 +579,9 @@ static void BM_SM50_device_binary_or_binary_and_dsrgemm_tn_n_32x32x8_16x32x1_4x4 using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -629,9 +629,9 @@ static void BM_SM50_device_binary_or_binary_and_dsrgemm_tn_n_64x32x8_32x32x1_8x4 using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -679,9 +679,9 @@ static void BM_SM50_device_binary_or_binary_and_dsrgemm_tn_n_16x32x8_8x16x1_2x2_ using WarpShape = cutlass::gemm::GemmShape<8, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename 
cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -729,9 +729,9 @@ static void BM_SM50_device_binary_or_binary_and_dsrgemm_tn_n_16x64x8_8x32x1_2x4_ using WarpShape = cutlass::gemm::GemmShape<8, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -779,9 +779,9 @@ static void BM_SM50_device_binary_or_binary_and_dsrgemm_tn_n_32x32x8_16x16x1_4x2 using WarpShape = cutlass::gemm::GemmShape<16, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -829,9 +829,9 @@ static void BM_SM50_device_binary_or_binary_and_dsrgemm_tn_n_32x64x8_16x32x1_4x4 using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename 
cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -879,9 +879,9 @@ static void BM_SM50_device_binary_or_binary_and_dsrgemm_tn_n_32x128x8_16x64x1_4x using WarpShape = cutlass::gemm::GemmShape<16, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -929,9 +929,9 @@ static void BM_SM50_device_binary_or_binary_and_dsrgemm_tn_n_64x32x8_32x16x1_4x4 using WarpShape = cutlass::gemm::GemmShape<32, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -979,9 +979,9 @@ static void BM_SM50_device_binary_or_binary_and_dsrgemm_tn_n_64x64x8_32x32x1_8x4 using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename 
cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1029,9 +1029,9 @@ static void BM_SM50_device_binary_or_binary_and_dsrgemm_tn_n_128x32x8_64x16x1_8x using WarpShape = cutlass::gemm::GemmShape<64, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1079,9 +1079,9 @@ static void BM_SM50_device_binary_or_binary_and_dsrgemm_tn_n_16x64x16_8x16x1_2x2 using WarpShape = cutlass::gemm::GemmShape<8, 16, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1129,9 +1129,9 @@ static void BM_SM50_device_binary_or_binary_and_dsrgemm_tn_n_16x128x16_8x32x1_2x using WarpShape = cutlass::gemm::GemmShape<8, 32, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename 
cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1179,9 +1179,9 @@ static void BM_SM50_device_binary_or_binary_and_dsrgemm_tn_n_32x32x8_16x8x1_2x2_ using WarpShape = cutlass::gemm::GemmShape<16, 8, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1229,9 +1229,9 @@ static void BM_SM50_device_binary_or_binary_and_dsrgemm_tn_n_32x64x8_16x16x1_4x2 using WarpShape = cutlass::gemm::GemmShape<16, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1279,9 +1279,9 @@ static void BM_SM50_device_binary_or_binary_and_dsrgemm_tn_n_32x128x8_16x32x1_4x using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename 
cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1329,9 +1329,9 @@ static void BM_SM50_device_binary_or_binary_and_dsrgemm_tn_n_64x64x8_32x16x1_4x4 using WarpShape = cutlass::gemm::GemmShape<32, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1379,9 +1379,9 @@ static void BM_SM50_device_binary_or_binary_and_dsrgemm_tn_n_32x32x8_8x16x1_2x2_ using WarpShape = cutlass::gemm::GemmShape<8, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1429,9 +1429,9 @@ static void BM_SM50_device_binary_or_binary_and_dsrgemm_tn_n_64x32x8_16x16x1_4x2 using WarpShape = cutlass::gemm::GemmShape<16, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename 
cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1479,9 +1479,9 @@ static void BM_SM50_device_binary_or_binary_and_dsrgemm_tn_n_64x64x8_16x32x1_4x4 using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1529,9 +1529,9 @@ static void BM_SM50_device_binary_or_binary_and_dsrgemm_tn_n_128x32x8_32x16x1_4x using WarpShape = cutlass::gemm::GemmShape<32, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1579,9 +1579,9 @@ static void BM_SM50_device_binary_or_binary_and_dsrgemm_tn_n_32x64x16_8x16x1_2x2 using WarpShape = cutlass::gemm::GemmShape<8, 16, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename 
cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1629,9 +1629,9 @@ static void BM_SM50_device_binary_or_binary_and_dsrgemm_tn_n_32x128x16_8x32x1_2x using WarpShape = cutlass::gemm::GemmShape<8, 32, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1679,9 +1679,9 @@ static void BM_SM50_device_binary_or_binary_and_dsrgemm_tn_n_64x32x16_16x8x1_2x2 using WarpShape = cutlass::gemm::GemmShape<16, 8, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1729,9 +1729,9 @@ static void BM_SM50_device_binary_or_binary_and_dsrgemm_tn_n_64x64x8_16x16x1_4x2 using WarpShape = cutlass::gemm::GemmShape<16, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename 
cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1779,9 +1779,9 @@ static void BM_SM50_device_binary_or_binary_and_dsrgemm_tn_n_128x32x16_32x8x1_4x using WarpShape = cutlass::gemm::GemmShape<32, 8, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; diff --git a/bench/device/sm50_simt_binary_or_binary_and_dsrgemm_tn_t.cu b/bench/device/sm50_simt_binary_or_binary_and_dsrgemm_tn_t.cu index 2e9673e..c5f2f9c 100644 --- a/bench/device/sm50_simt_binary_or_binary_and_dsrgemm_tn_t.cu +++ b/bench/device/sm50_simt_binary_or_binary_and_dsrgemm_tn_t.cu @@ -29,9 +29,9 @@ static void BM_SM50_device_binary_or_binary_and_dsrgemm_tn_t_8x32x8_8x32x1_2x4_4 using WarpShape = cutlass::gemm::GemmShape<8, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -79,9 +79,9 @@ static void BM_SM50_device_binary_or_binary_and_dsrgemm_tn_t_16x32x8_16x32x1_4x4 using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using 
InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -129,9 +129,9 @@ static void BM_SM50_device_binary_or_binary_and_dsrgemm_tn_t_16x64x8_16x64x1_4x8 using WarpShape = cutlass::gemm::GemmShape<16, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -179,9 +179,9 @@ static void BM_SM50_device_binary_or_binary_and_dsrgemm_tn_t_32x32x8_32x32x1_8x4 using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -229,9 +229,9 @@ static void BM_SM50_device_binary_or_binary_and_dsrgemm_tn_t_8x32x8_8x16x1_2x2_4 using WarpShape = cutlass::gemm::GemmShape<8, 16, 8>; using InstructionShape = 
cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -279,9 +279,9 @@ static void BM_SM50_device_binary_or_binary_and_dsrgemm_tn_t_8x64x8_8x32x1_2x4_4 using WarpShape = cutlass::gemm::GemmShape<8, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -329,9 +329,9 @@ static void BM_SM50_device_binary_or_binary_and_dsrgemm_tn_t_16x32x8_16x16x1_4x2 using WarpShape = cutlass::gemm::GemmShape<16, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -379,9 +379,9 @@ static void BM_SM50_device_binary_or_binary_and_dsrgemm_tn_t_16x64x8_16x32x1_4x4 using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 
1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -429,9 +429,9 @@ static void BM_SM50_device_binary_or_binary_and_dsrgemm_tn_t_16x128x8_16x64x1_4x using WarpShape = cutlass::gemm::GemmShape<16, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -479,9 +479,9 @@ static void BM_SM50_device_binary_or_binary_and_dsrgemm_tn_t_32x32x8_32x16x1_4x4 using WarpShape = cutlass::gemm::GemmShape<32, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -529,9 +529,9 @@ static void BM_SM50_device_binary_or_binary_and_dsrgemm_tn_t_32x64x8_32x32x1_8x4 using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = 
typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -579,9 +579,9 @@ static void BM_SM50_device_binary_or_binary_and_dsrgemm_tn_t_32x32x8_16x32x1_4x4 using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -629,9 +629,9 @@ static void BM_SM50_device_binary_or_binary_and_dsrgemm_tn_t_64x32x8_32x32x1_8x4 using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -679,9 +679,9 @@ static void BM_SM50_device_binary_or_binary_and_dsrgemm_tn_t_16x32x8_8x16x1_2x2_ using WarpShape = cutlass::gemm::GemmShape<8, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename 
cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -729,9 +729,9 @@ static void BM_SM50_device_binary_or_binary_and_dsrgemm_tn_t_16x64x8_8x32x1_2x4_ using WarpShape = cutlass::gemm::GemmShape<8, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -779,9 +779,9 @@ static void BM_SM50_device_binary_or_binary_and_dsrgemm_tn_t_32x32x8_16x16x1_4x2 using WarpShape = cutlass::gemm::GemmShape<16, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -829,9 +829,9 @@ static void BM_SM50_device_binary_or_binary_and_dsrgemm_tn_t_32x64x8_16x32x1_4x4 using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename 
cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -879,9 +879,9 @@ static void BM_SM50_device_binary_or_binary_and_dsrgemm_tn_t_32x128x8_16x64x1_4x using WarpShape = cutlass::gemm::GemmShape<16, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -929,9 +929,9 @@ static void BM_SM50_device_binary_or_binary_and_dsrgemm_tn_t_64x32x8_32x16x1_4x4 using WarpShape = cutlass::gemm::GemmShape<32, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -979,9 +979,9 @@ static void BM_SM50_device_binary_or_binary_and_dsrgemm_tn_t_64x64x8_32x32x1_8x4 using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename 
cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1029,9 +1029,9 @@ static void BM_SM50_device_binary_or_binary_and_dsrgemm_tn_t_128x32x8_64x16x1_8x using WarpShape = cutlass::gemm::GemmShape<64, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1079,9 +1079,9 @@ static void BM_SM50_device_binary_or_binary_and_dsrgemm_tn_t_16x64x16_8x16x1_2x2 using WarpShape = cutlass::gemm::GemmShape<8, 16, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1129,9 +1129,9 @@ static void BM_SM50_device_binary_or_binary_and_dsrgemm_tn_t_16x128x16_8x32x1_2x using WarpShape = cutlass::gemm::GemmShape<8, 32, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename 
cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1179,9 +1179,9 @@ static void BM_SM50_device_binary_or_binary_and_dsrgemm_tn_t_32x32x8_16x8x1_2x2_ using WarpShape = cutlass::gemm::GemmShape<16, 8, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1229,9 +1229,9 @@ static void BM_SM50_device_binary_or_binary_and_dsrgemm_tn_t_32x64x8_16x16x1_4x2 using WarpShape = cutlass::gemm::GemmShape<16, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1279,9 +1279,9 @@ static void BM_SM50_device_binary_or_binary_and_dsrgemm_tn_t_32x128x8_16x32x1_4x using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename 
cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1329,9 +1329,9 @@ static void BM_SM50_device_binary_or_binary_and_dsrgemm_tn_t_64x64x8_32x16x1_4x4 using WarpShape = cutlass::gemm::GemmShape<32, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1379,9 +1379,9 @@ static void BM_SM50_device_binary_or_binary_and_dsrgemm_tn_t_32x32x8_8x16x1_2x2_ using WarpShape = cutlass::gemm::GemmShape<8, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1429,9 +1429,9 @@ static void BM_SM50_device_binary_or_binary_and_dsrgemm_tn_t_64x32x8_16x16x1_4x2 using WarpShape = cutlass::gemm::GemmShape<16, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename 
cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1479,9 +1479,9 @@ static void BM_SM50_device_binary_or_binary_and_dsrgemm_tn_t_64x64x8_16x32x1_4x4 using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1529,9 +1529,9 @@ static void BM_SM50_device_binary_or_binary_and_dsrgemm_tn_t_128x32x8_32x16x1_4x using WarpShape = cutlass::gemm::GemmShape<32, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1579,9 +1579,9 @@ static void BM_SM50_device_binary_or_binary_and_dsrgemm_tn_t_32x64x16_8x16x1_2x2 using WarpShape = cutlass::gemm::GemmShape<8, 16, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename 
cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1629,9 +1629,9 @@ static void BM_SM50_device_binary_or_binary_and_dsrgemm_tn_t_32x128x16_8x32x1_2x using WarpShape = cutlass::gemm::GemmShape<8, 32, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1679,9 +1679,9 @@ static void BM_SM50_device_binary_or_binary_and_dsrgemm_tn_t_64x32x16_16x8x1_2x2 using WarpShape = cutlass::gemm::GemmShape<16, 8, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1729,9 +1729,9 @@ static void BM_SM50_device_binary_or_binary_and_dsrgemm_tn_t_64x64x8_16x16x1_4x2 using WarpShape = cutlass::gemm::GemmShape<16, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename 
cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1779,9 +1779,9 @@ static void BM_SM50_device_binary_or_binary_and_dsrgemm_tn_t_128x32x16_32x8x1_4x using WarpShape = cutlass::gemm::GemmShape<32, 8, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; diff --git a/bench/device/sm50_simt_binary_or_binary_and_dsrgemm_tt_n.cu b/bench/device/sm50_simt_binary_or_binary_and_dsrgemm_tt_n.cu index 413790d..ff7c154 100644 --- a/bench/device/sm50_simt_binary_or_binary_and_dsrgemm_tt_n.cu +++ b/bench/device/sm50_simt_binary_or_binary_and_dsrgemm_tt_n.cu @@ -29,9 +29,9 @@ static void BM_SM50_device_binary_or_binary_and_dsrgemm_tt_n_8x32x8_8x32x1_2x4_4 using WarpShape = cutlass::gemm::GemmShape<8, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = 
Config::MultiplicationOp; @@ -79,9 +79,9 @@ static void BM_SM50_device_binary_or_binary_and_dsrgemm_tt_n_16x32x8_16x32x1_4x4 using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -129,9 +129,9 @@ static void BM_SM50_device_binary_or_binary_and_dsrgemm_tt_n_16x64x8_16x64x1_4x8 using WarpShape = cutlass::gemm::GemmShape<16, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -179,9 +179,9 @@ static void BM_SM50_device_binary_or_binary_and_dsrgemm_tt_n_32x32x8_32x32x1_8x4 using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ 
-229,9 +229,9 @@ static void BM_SM50_device_binary_or_binary_and_dsrgemm_tt_n_8x32x8_8x16x1_2x2_4 using WarpShape = cutlass::gemm::GemmShape<8, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -279,9 +279,9 @@ static void BM_SM50_device_binary_or_binary_and_dsrgemm_tt_n_8x64x8_8x32x1_2x4_4 using WarpShape = cutlass::gemm::GemmShape<8, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -329,9 +329,9 @@ static void BM_SM50_device_binary_or_binary_and_dsrgemm_tt_n_16x32x8_16x16x1_4x2 using WarpShape = cutlass::gemm::GemmShape<16, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -379,9 +379,9 @@ static void 
BM_SM50_device_binary_or_binary_and_dsrgemm_tt_n_16x64x8_16x32x1_4x4 using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -429,9 +429,9 @@ static void BM_SM50_device_binary_or_binary_and_dsrgemm_tt_n_16x128x8_16x64x1_4x using WarpShape = cutlass::gemm::GemmShape<16, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -479,9 +479,9 @@ static void BM_SM50_device_binary_or_binary_and_dsrgemm_tt_n_32x32x8_32x16x1_4x4 using WarpShape = cutlass::gemm::GemmShape<32, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -529,9 +529,9 @@ static void 
BM_SM50_device_binary_or_binary_and_dsrgemm_tt_n_32x64x8_32x32x1_8x4 using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -579,9 +579,9 @@ static void BM_SM50_device_binary_or_binary_and_dsrgemm_tt_n_32x32x8_16x32x1_4x4 using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -629,9 +629,9 @@ static void BM_SM50_device_binary_or_binary_and_dsrgemm_tt_n_64x32x8_32x32x1_8x4 using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -679,9 +679,9 @@ static void 
BM_SM50_device_binary_or_binary_and_dsrgemm_tt_n_16x32x8_8x16x1_2x2_ using WarpShape = cutlass::gemm::GemmShape<8, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -729,9 +729,9 @@ static void BM_SM50_device_binary_or_binary_and_dsrgemm_tt_n_16x64x8_8x32x1_2x4_ using WarpShape = cutlass::gemm::GemmShape<8, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -779,9 +779,9 @@ static void BM_SM50_device_binary_or_binary_and_dsrgemm_tt_n_32x32x8_16x16x1_4x2 using WarpShape = cutlass::gemm::GemmShape<16, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -829,9 +829,9 @@ static void 
BM_SM50_device_binary_or_binary_and_dsrgemm_tt_n_32x64x8_16x32x1_4x4 using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -879,9 +879,9 @@ static void BM_SM50_device_binary_or_binary_and_dsrgemm_tt_n_32x128x8_16x64x1_4x using WarpShape = cutlass::gemm::GemmShape<16, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -929,9 +929,9 @@ static void BM_SM50_device_binary_or_binary_and_dsrgemm_tt_n_64x32x8_32x16x1_4x4 using WarpShape = cutlass::gemm::GemmShape<32, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -979,9 +979,9 @@ static void 
BM_SM50_device_binary_or_binary_and_dsrgemm_tt_n_64x64x8_32x32x1_8x4 using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1029,9 +1029,9 @@ static void BM_SM50_device_binary_or_binary_and_dsrgemm_tt_n_128x32x8_64x16x1_8x using WarpShape = cutlass::gemm::GemmShape<64, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1079,9 +1079,9 @@ static void BM_SM50_device_binary_or_binary_and_dsrgemm_tt_n_16x64x16_8x16x1_2x2 using WarpShape = cutlass::gemm::GemmShape<8, 16, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1129,9 +1129,9 @@ static void 
BM_SM50_device_binary_or_binary_and_dsrgemm_tt_n_16x128x16_8x32x1_2x using WarpShape = cutlass::gemm::GemmShape<8, 32, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1179,9 +1179,9 @@ static void BM_SM50_device_binary_or_binary_and_dsrgemm_tt_n_32x32x8_16x8x1_2x2_ using WarpShape = cutlass::gemm::GemmShape<16, 8, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1229,9 +1229,9 @@ static void BM_SM50_device_binary_or_binary_and_dsrgemm_tt_n_32x64x8_16x16x1_4x2 using WarpShape = cutlass::gemm::GemmShape<16, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1279,9 +1279,9 @@ static void 
BM_SM50_device_binary_or_binary_and_dsrgemm_tt_n_32x128x8_16x32x1_4x using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1329,9 +1329,9 @@ static void BM_SM50_device_binary_or_binary_and_dsrgemm_tt_n_64x64x8_32x16x1_4x4 using WarpShape = cutlass::gemm::GemmShape<32, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1379,9 +1379,9 @@ static void BM_SM50_device_binary_or_binary_and_dsrgemm_tt_n_32x32x8_8x16x1_2x2_ using WarpShape = cutlass::gemm::GemmShape<8, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1429,9 +1429,9 @@ static void 
BM_SM50_device_binary_or_binary_and_dsrgemm_tt_n_64x32x8_16x16x1_4x2 using WarpShape = cutlass::gemm::GemmShape<16, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1479,9 +1479,9 @@ static void BM_SM50_device_binary_or_binary_and_dsrgemm_tt_n_64x64x8_16x32x1_4x4 using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1529,9 +1529,9 @@ static void BM_SM50_device_binary_or_binary_and_dsrgemm_tt_n_128x32x8_32x16x1_4x using WarpShape = cutlass::gemm::GemmShape<32, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1579,9 +1579,9 @@ static void 
BM_SM50_device_binary_or_binary_and_dsrgemm_tt_n_32x64x16_8x16x1_2x2 using WarpShape = cutlass::gemm::GemmShape<8, 16, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1629,9 +1629,9 @@ static void BM_SM50_device_binary_or_binary_and_dsrgemm_tt_n_32x128x16_8x32x1_2x using WarpShape = cutlass::gemm::GemmShape<8, 32, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1679,9 +1679,9 @@ static void BM_SM50_device_binary_or_binary_and_dsrgemm_tt_n_64x32x16_16x8x1_2x2 using WarpShape = cutlass::gemm::GemmShape<16, 8, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1729,9 +1729,9 @@ static void 
BM_SM50_device_binary_or_binary_and_dsrgemm_tt_n_64x64x8_16x16x1_4x2 using WarpShape = cutlass::gemm::GemmShape<16, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1779,9 +1779,9 @@ static void BM_SM50_device_binary_or_binary_and_dsrgemm_tt_n_128x32x16_32x8x1_4x using WarpShape = cutlass::gemm::GemmShape<32, 8, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; diff --git a/bench/device/sm50_simt_binary_or_binary_and_dsrgemm_tt_t.cu b/bench/device/sm50_simt_binary_or_binary_and_dsrgemm_tt_t.cu index 4078e77..9e8f6da 100644 --- a/bench/device/sm50_simt_binary_or_binary_and_dsrgemm_tt_t.cu +++ b/bench/device/sm50_simt_binary_or_binary_and_dsrgemm_tt_t.cu @@ -29,9 +29,9 @@ static void BM_SM50_device_binary_or_binary_and_dsrgemm_tt_t_8x32x8_8x32x1_2x4_4 using WarpShape = cutlass::gemm::GemmShape<8, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = 
typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -79,9 +79,9 @@ static void BM_SM50_device_binary_or_binary_and_dsrgemm_tt_t_16x32x8_16x32x1_4x4 using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -129,9 +129,9 @@ static void BM_SM50_device_binary_or_binary_and_dsrgemm_tt_t_16x64x8_16x64x1_4x8 using WarpShape = cutlass::gemm::GemmShape<16, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -179,9 +179,9 @@ static void BM_SM50_device_binary_or_binary_and_dsrgemm_tt_t_32x32x8_32x32x1_8x4 using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename 
cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -229,9 +229,9 @@ static void BM_SM50_device_binary_or_binary_and_dsrgemm_tt_t_8x32x8_8x16x1_2x2_4 using WarpShape = cutlass::gemm::GemmShape<8, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -279,9 +279,9 @@ static void BM_SM50_device_binary_or_binary_and_dsrgemm_tt_t_8x64x8_8x32x1_2x4_4 using WarpShape = cutlass::gemm::GemmShape<8, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -329,9 +329,9 @@ static void BM_SM50_device_binary_or_binary_and_dsrgemm_tt_t_16x32x8_16x16x1_4x2 using WarpShape = cutlass::gemm::GemmShape<16, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename 
cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -379,9 +379,9 @@ static void BM_SM50_device_binary_or_binary_and_dsrgemm_tt_t_16x64x8_16x32x1_4x4 using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -429,9 +429,9 @@ static void BM_SM50_device_binary_or_binary_and_dsrgemm_tt_t_16x128x8_16x64x1_4x using WarpShape = cutlass::gemm::GemmShape<16, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -479,9 +479,9 @@ static void BM_SM50_device_binary_or_binary_and_dsrgemm_tt_t_32x32x8_32x16x1_4x4 using WarpShape = cutlass::gemm::GemmShape<32, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename 
cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -529,9 +529,9 @@ static void BM_SM50_device_binary_or_binary_and_dsrgemm_tt_t_32x64x8_32x32x1_8x4 using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -579,9 +579,9 @@ static void BM_SM50_device_binary_or_binary_and_dsrgemm_tt_t_32x32x8_16x32x1_4x4 using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -629,9 +629,9 @@ static void BM_SM50_device_binary_or_binary_and_dsrgemm_tt_t_64x32x8_32x32x1_8x4 using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename 
cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -679,9 +679,9 @@ static void BM_SM50_device_binary_or_binary_and_dsrgemm_tt_t_16x32x8_8x16x1_2x2_ using WarpShape = cutlass::gemm::GemmShape<8, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -729,9 +729,9 @@ static void BM_SM50_device_binary_or_binary_and_dsrgemm_tt_t_16x64x8_8x32x1_2x4_ using WarpShape = cutlass::gemm::GemmShape<8, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -779,9 +779,9 @@ static void BM_SM50_device_binary_or_binary_and_dsrgemm_tt_t_32x32x8_16x16x1_4x2 using WarpShape = cutlass::gemm::GemmShape<16, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename 
cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -829,9 +829,9 @@ static void BM_SM50_device_binary_or_binary_and_dsrgemm_tt_t_32x64x8_16x32x1_4x4 using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -879,9 +879,9 @@ static void BM_SM50_device_binary_or_binary_and_dsrgemm_tt_t_32x128x8_16x64x1_4x using WarpShape = cutlass::gemm::GemmShape<16, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -929,9 +929,9 @@ static void BM_SM50_device_binary_or_binary_and_dsrgemm_tt_t_64x32x8_32x16x1_4x4 using WarpShape = cutlass::gemm::GemmShape<32, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename 
cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -979,9 +979,9 @@ static void BM_SM50_device_binary_or_binary_and_dsrgemm_tt_t_64x64x8_32x32x1_8x4 using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1029,9 +1029,9 @@ static void BM_SM50_device_binary_or_binary_and_dsrgemm_tt_t_128x32x8_64x16x1_8x using WarpShape = cutlass::gemm::GemmShape<64, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1079,9 +1079,9 @@ static void BM_SM50_device_binary_or_binary_and_dsrgemm_tt_t_16x64x16_8x16x1_2x2 using WarpShape = cutlass::gemm::GemmShape<8, 16, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename 
cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1129,9 +1129,9 @@ static void BM_SM50_device_binary_or_binary_and_dsrgemm_tt_t_16x128x16_8x32x1_2x using WarpShape = cutlass::gemm::GemmShape<8, 32, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1179,9 +1179,9 @@ static void BM_SM50_device_binary_or_binary_and_dsrgemm_tt_t_32x32x8_16x8x1_2x2_ using WarpShape = cutlass::gemm::GemmShape<16, 8, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1229,9 +1229,9 @@ static void BM_SM50_device_binary_or_binary_and_dsrgemm_tt_t_32x64x8_16x16x1_4x2 using WarpShape = cutlass::gemm::GemmShape<16, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename 
cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1279,9 +1279,9 @@ static void BM_SM50_device_binary_or_binary_and_dsrgemm_tt_t_32x128x8_16x32x1_4x using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1329,9 +1329,9 @@ static void BM_SM50_device_binary_or_binary_and_dsrgemm_tt_t_64x64x8_32x16x1_4x4 using WarpShape = cutlass::gemm::GemmShape<32, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1379,9 +1379,9 @@ static void BM_SM50_device_binary_or_binary_and_dsrgemm_tt_t_32x32x8_8x16x1_2x2_ using WarpShape = cutlass::gemm::GemmShape<8, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename 
cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1429,9 +1429,9 @@ static void BM_SM50_device_binary_or_binary_and_dsrgemm_tt_t_64x32x8_16x16x1_4x2 using WarpShape = cutlass::gemm::GemmShape<16, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1479,9 +1479,9 @@ static void BM_SM50_device_binary_or_binary_and_dsrgemm_tt_t_64x64x8_16x32x1_4x4 using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1529,9 +1529,9 @@ static void BM_SM50_device_binary_or_binary_and_dsrgemm_tt_t_128x32x8_32x16x1_4x using WarpShape = cutlass::gemm::GemmShape<32, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename 
cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1579,9 +1579,9 @@ static void BM_SM50_device_binary_or_binary_and_dsrgemm_tt_t_32x64x16_8x16x1_2x2 using WarpShape = cutlass::gemm::GemmShape<8, 16, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1629,9 +1629,9 @@ static void BM_SM50_device_binary_or_binary_and_dsrgemm_tt_t_32x128x16_8x32x1_2x using WarpShape = cutlass::gemm::GemmShape<8, 32, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1679,9 +1679,9 @@ static void BM_SM50_device_binary_or_binary_and_dsrgemm_tt_t_64x32x16_16x8x1_2x2 using WarpShape = cutlass::gemm::GemmShape<16, 8, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename 
cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1729,9 +1729,9 @@ static void BM_SM50_device_binary_or_binary_and_dsrgemm_tt_t_64x64x8_16x16x1_4x2 using WarpShape = cutlass::gemm::GemmShape<16, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1779,9 +1779,9 @@ static void BM_SM50_device_binary_or_binary_and_dsrgemm_tt_t_128x32x16_32x8x1_4x using WarpShape = cutlass::gemm::GemmShape<32, 8, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; diff --git a/bench/device/sm50_simt_binary_or_binary_and_ssrgemm_nn_n.cu b/bench/device/sm50_simt_binary_or_binary_and_ssrgemm_nn_n.cu index 9da2e71..7731c84 100644 --- a/bench/device/sm50_simt_binary_or_binary_and_ssrgemm_nn_n.cu +++ b/bench/device/sm50_simt_binary_or_binary_and_ssrgemm_nn_n.cu @@ -29,9 +29,9 @@ static void BM_SM50_device_binary_or_binary_and_ssrgemm_nn_n_8x32x8_8x32x1_2x4_4 using WarpShape = cutlass::gemm::GemmShape<8, 32, 8>; 
using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -79,9 +79,9 @@ static void BM_SM50_device_binary_or_binary_and_ssrgemm_nn_n_16x32x8_16x32x1_4x4 using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -129,9 +129,9 @@ static void BM_SM50_device_binary_or_binary_and_ssrgemm_nn_n_16x64x8_16x64x1_4x8 using WarpShape = cutlass::gemm::GemmShape<16, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -179,9 +179,9 @@ static void BM_SM50_device_binary_or_binary_and_ssrgemm_nn_n_32x32x8_32x32x1_8x4 using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = 
cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -229,9 +229,9 @@ static void BM_SM50_device_binary_or_binary_and_ssrgemm_nn_n_32x64x8_32x64x1_8x8 using WarpShape = cutlass::gemm::GemmShape<32, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -279,9 +279,9 @@ static void BM_SM50_device_binary_or_binary_and_ssrgemm_nn_n_64x32x8_64x32x1_8x8 using WarpShape = cutlass::gemm::GemmShape<64, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -329,9 +329,9 @@ static void BM_SM50_device_binary_or_binary_and_ssrgemm_nn_n_8x32x8_8x16x1_2x2_4 using WarpShape = cutlass::gemm::GemmShape<8, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 
1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -379,9 +379,9 @@ static void BM_SM50_device_binary_or_binary_and_ssrgemm_nn_n_8x64x8_8x32x1_2x4_4 using WarpShape = cutlass::gemm::GemmShape<8, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -429,9 +429,9 @@ static void BM_SM50_device_binary_or_binary_and_ssrgemm_nn_n_16x32x8_16x16x1_4x2 using WarpShape = cutlass::gemm::GemmShape<16, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -479,9 +479,9 @@ static void BM_SM50_device_binary_or_binary_and_ssrgemm_nn_n_16x64x8_16x32x1_4x4 using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = 
typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -529,9 +529,9 @@ static void BM_SM50_device_binary_or_binary_and_ssrgemm_nn_n_16x128x8_16x64x1_4x using WarpShape = cutlass::gemm::GemmShape<16, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -579,9 +579,9 @@ static void BM_SM50_device_binary_or_binary_and_ssrgemm_nn_n_32x32x8_32x16x1_4x4 using WarpShape = cutlass::gemm::GemmShape<32, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -629,9 +629,9 @@ static void BM_SM50_device_binary_or_binary_and_ssrgemm_nn_n_32x64x8_32x32x1_8x4 using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename 
cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -679,9 +679,9 @@ static void BM_SM50_device_binary_or_binary_and_ssrgemm_nn_n_32x128x8_32x64x1_8x using WarpShape = cutlass::gemm::GemmShape<32, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -729,9 +729,9 @@ static void BM_SM50_device_binary_or_binary_and_ssrgemm_nn_n_64x64x8_64x32x1_8x8 using WarpShape = cutlass::gemm::GemmShape<64, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -779,9 +779,9 @@ static void BM_SM50_device_binary_or_binary_and_ssrgemm_nn_n_32x32x8_16x32x1_4x4 using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename 
cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -829,9 +829,9 @@ static void BM_SM50_device_binary_or_binary_and_ssrgemm_nn_n_64x32x8_32x32x1_8x4 using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -879,9 +879,9 @@ static void BM_SM50_device_binary_or_binary_and_ssrgemm_nn_n_64x64x8_32x64x1_8x8 using WarpShape = cutlass::gemm::GemmShape<32, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -929,9 +929,9 @@ static void BM_SM50_device_binary_or_binary_and_ssrgemm_nn_n_128x32x8_64x32x1_8x using WarpShape = cutlass::gemm::GemmShape<64, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename 
cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -979,9 +979,9 @@ static void BM_SM50_device_binary_or_binary_and_ssrgemm_nn_n_16x32x8_8x16x1_2x2_ using WarpShape = cutlass::gemm::GemmShape<8, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1029,9 +1029,9 @@ static void BM_SM50_device_binary_or_binary_and_ssrgemm_nn_n_16x64x8_8x32x1_2x4_ using WarpShape = cutlass::gemm::GemmShape<8, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1079,9 +1079,9 @@ static void BM_SM50_device_binary_or_binary_and_ssrgemm_nn_n_32x32x8_16x16x1_4x2 using WarpShape = cutlass::gemm::GemmShape<16, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename 
cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1129,9 +1129,9 @@ static void BM_SM50_device_binary_or_binary_and_ssrgemm_nn_n_32x64x8_16x32x1_4x4 using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1179,9 +1179,9 @@ static void BM_SM50_device_binary_or_binary_and_ssrgemm_nn_n_32x128x8_16x64x1_4x using WarpShape = cutlass::gemm::GemmShape<16, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1229,9 +1229,9 @@ static void BM_SM50_device_binary_or_binary_and_ssrgemm_nn_n_64x32x8_32x16x1_4x4 using WarpShape = cutlass::gemm::GemmShape<32, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename 
cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1279,9 +1279,9 @@ static void BM_SM50_device_binary_or_binary_and_ssrgemm_nn_n_64x64x8_32x32x1_8x4 using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1329,9 +1329,9 @@ static void BM_SM50_device_binary_or_binary_and_ssrgemm_nn_n_64x128x8_32x64x1_8x using WarpShape = cutlass::gemm::GemmShape<32, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1379,9 +1379,9 @@ static void BM_SM50_device_binary_or_binary_and_ssrgemm_nn_n_128x32x8_64x16x1_8x using WarpShape = cutlass::gemm::GemmShape<64, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename 
cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1429,9 +1429,9 @@ static void BM_SM50_device_binary_or_binary_and_ssrgemm_nn_n_128x64x8_64x32x1_8x using WarpShape = cutlass::gemm::GemmShape<64, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1479,9 +1479,9 @@ static void BM_SM50_device_binary_or_binary_and_ssrgemm_nn_n_16x64x16_8x16x1_2x2 using WarpShape = cutlass::gemm::GemmShape<8, 16, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1529,9 +1529,9 @@ static void BM_SM50_device_binary_or_binary_and_ssrgemm_nn_n_16x128x16_8x32x1_2x using WarpShape = cutlass::gemm::GemmShape<8, 32, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename 
cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1579,9 +1579,9 @@ static void BM_SM50_device_binary_or_binary_and_ssrgemm_nn_n_32x32x8_16x8x1_2x2_ using WarpShape = cutlass::gemm::GemmShape<16, 8, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1629,9 +1629,9 @@ static void BM_SM50_device_binary_or_binary_and_ssrgemm_nn_n_32x64x8_16x16x1_4x2 using WarpShape = cutlass::gemm::GemmShape<16, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1679,9 +1679,9 @@ static void BM_SM50_device_binary_or_binary_and_ssrgemm_nn_n_32x128x8_16x32x1_4x using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename 
cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1729,9 +1729,9 @@ static void BM_SM50_device_binary_or_binary_and_ssrgemm_nn_n_32x256x8_16x64x1_4x using WarpShape = cutlass::gemm::GemmShape<16, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1779,9 +1779,9 @@ static void BM_SM50_device_binary_or_binary_and_ssrgemm_nn_n_64x64x8_32x16x1_4x4 using WarpShape = cutlass::gemm::GemmShape<32, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1829,9 +1829,9 @@ static void BM_SM50_device_binary_or_binary_and_ssrgemm_nn_n_64x128x8_32x32x1_8x using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename 
cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1879,9 +1879,9 @@ static void BM_SM50_device_binary_or_binary_and_ssrgemm_nn_n_64x256x8_32x64x1_8x using WarpShape = cutlass::gemm::GemmShape<32, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1929,9 +1929,9 @@ static void BM_SM50_device_binary_or_binary_and_ssrgemm_nn_n_128x128x8_64x32x1_8 using WarpShape = cutlass::gemm::GemmShape<64, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1979,9 +1979,9 @@ static void BM_SM50_device_binary_or_binary_and_ssrgemm_nn_n_32x32x8_8x16x1_2x2_ using WarpShape = cutlass::gemm::GemmShape<8, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename 
cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -2029,9 +2029,9 @@ static void BM_SM50_device_binary_or_binary_and_ssrgemm_nn_n_64x32x8_16x16x1_4x2 using WarpShape = cutlass::gemm::GemmShape<16, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -2079,9 +2079,9 @@ static void BM_SM50_device_binary_or_binary_and_ssrgemm_nn_n_64x64x8_16x32x1_4x4 using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -2129,9 +2129,9 @@ static void BM_SM50_device_binary_or_binary_and_ssrgemm_nn_n_128x32x8_32x16x1_4x using WarpShape = cutlass::gemm::GemmShape<32, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename 
cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -2179,9 +2179,9 @@ static void BM_SM50_device_binary_or_binary_and_ssrgemm_nn_n_128x64x8_32x32x1_8x using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -2229,9 +2229,9 @@ static void BM_SM50_device_binary_or_binary_and_ssrgemm_nn_n_128x128x8_32x64x1_8 using WarpShape = cutlass::gemm::GemmShape<32, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -2279,9 +2279,9 @@ static void BM_SM50_device_binary_or_binary_and_ssrgemm_nn_n_256x32x8_64x16x1_8x using WarpShape = cutlass::gemm::GemmShape<64, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename 
cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -2329,9 +2329,9 @@ static void BM_SM50_device_binary_or_binary_and_ssrgemm_nn_n_256x64x8_64x32x1_8x using WarpShape = cutlass::gemm::GemmShape<64, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -2379,9 +2379,9 @@ static void BM_SM50_device_binary_or_binary_and_ssrgemm_nn_n_32x64x16_8x16x1_2x2 using WarpShape = cutlass::gemm::GemmShape<8, 16, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -2429,9 +2429,9 @@ static void BM_SM50_device_binary_or_binary_and_ssrgemm_nn_n_32x128x16_8x32x1_2x using WarpShape = cutlass::gemm::GemmShape<8, 32, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename 
cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -2479,9 +2479,9 @@ static void BM_SM50_device_binary_or_binary_and_ssrgemm_nn_n_64x32x16_16x8x1_2x2 using WarpShape = cutlass::gemm::GemmShape<16, 8, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -2529,9 +2529,9 @@ static void BM_SM50_device_binary_or_binary_and_ssrgemm_nn_n_64x64x8_16x16x1_4x2 using WarpShape = cutlass::gemm::GemmShape<16, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -2579,9 +2579,9 @@ static void BM_SM50_device_binary_or_binary_and_ssrgemm_nn_n_64x128x8_16x32x1_4x using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename 
cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -2629,9 +2629,9 @@ static void BM_SM50_device_binary_or_binary_and_ssrgemm_nn_n_64x256x8_16x64x1_4x using WarpShape = cutlass::gemm::GemmShape<16, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -2679,9 +2679,9 @@ static void BM_SM50_device_binary_or_binary_and_ssrgemm_nn_n_128x32x16_32x8x1_4x using WarpShape = cutlass::gemm::GemmShape<32, 8, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -2729,9 +2729,9 @@ static void BM_SM50_device_binary_or_binary_and_ssrgemm_nn_n_128x64x8_32x16x1_4x using WarpShape = cutlass::gemm::GemmShape<32, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename 
cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -2779,9 +2779,9 @@ static void BM_SM50_device_binary_or_binary_and_ssrgemm_nn_n_128x128x8_32x32x1_8 using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -2829,9 +2829,9 @@ static void BM_SM50_device_binary_or_binary_and_ssrgemm_nn_n_256x64x8_64x16x1_8x using WarpShape = cutlass::gemm::GemmShape<64, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; diff --git a/bench/device/sm50_simt_binary_or_binary_and_ssrgemm_nn_t.cu b/bench/device/sm50_simt_binary_or_binary_and_ssrgemm_nn_t.cu index d144940..7168b66 100644 --- a/bench/device/sm50_simt_binary_or_binary_and_ssrgemm_nn_t.cu +++ 
b/bench/device/sm50_simt_binary_or_binary_and_ssrgemm_nn_t.cu @@ -29,9 +29,9 @@ static void BM_SM50_device_binary_or_binary_and_ssrgemm_nn_t_8x32x8_8x32x1_2x4_4 using WarpShape = cutlass::gemm::GemmShape<8, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -79,9 +79,9 @@ static void BM_SM50_device_binary_or_binary_and_ssrgemm_nn_t_16x32x8_16x32x1_4x4 using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -129,9 +129,9 @@ static void BM_SM50_device_binary_or_binary_and_ssrgemm_nn_t_16x64x8_16x64x1_4x8 using WarpShape = cutlass::gemm::GemmShape<16, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp 
= Config::MultiplicationOp; @@ -179,9 +179,9 @@ static void BM_SM50_device_binary_or_binary_and_ssrgemm_nn_t_32x32x8_32x32x1_8x4 using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -229,9 +229,9 @@ static void BM_SM50_device_binary_or_binary_and_ssrgemm_nn_t_32x64x8_32x64x1_8x8 using WarpShape = cutlass::gemm::GemmShape<32, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -279,9 +279,9 @@ static void BM_SM50_device_binary_or_binary_and_ssrgemm_nn_t_64x32x8_64x32x1_8x8 using WarpShape = cutlass::gemm::GemmShape<64, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; 
@@ -329,9 +329,9 @@ static void BM_SM50_device_binary_or_binary_and_ssrgemm_nn_t_8x32x8_8x16x1_2x2_4 using WarpShape = cutlass::gemm::GemmShape<8, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -379,9 +379,9 @@ static void BM_SM50_device_binary_or_binary_and_ssrgemm_nn_t_8x64x8_8x32x1_2x4_4 using WarpShape = cutlass::gemm::GemmShape<8, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -429,9 +429,9 @@ static void BM_SM50_device_binary_or_binary_and_ssrgemm_nn_t_16x32x8_16x16x1_4x2 using WarpShape = cutlass::gemm::GemmShape<16, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -479,9 +479,9 @@ static 
void BM_SM50_device_binary_or_binary_and_ssrgemm_nn_t_16x64x8_16x32x1_4x4 using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -529,9 +529,9 @@ static void BM_SM50_device_binary_or_binary_and_ssrgemm_nn_t_16x128x8_16x64x1_4x using WarpShape = cutlass::gemm::GemmShape<16, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -579,9 +579,9 @@ static void BM_SM50_device_binary_or_binary_and_ssrgemm_nn_t_32x32x8_32x16x1_4x4 using WarpShape = cutlass::gemm::GemmShape<32, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -629,9 +629,9 @@ static void 
BM_SM50_device_binary_or_binary_and_ssrgemm_nn_t_32x64x8_32x32x1_8x4 using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -679,9 +679,9 @@ static void BM_SM50_device_binary_or_binary_and_ssrgemm_nn_t_32x128x8_32x64x1_8x using WarpShape = cutlass::gemm::GemmShape<32, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -729,9 +729,9 @@ static void BM_SM50_device_binary_or_binary_and_ssrgemm_nn_t_64x64x8_64x32x1_8x8 using WarpShape = cutlass::gemm::GemmShape<64, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -779,9 +779,9 @@ static void 
BM_SM50_device_binary_or_binary_and_ssrgemm_nn_t_32x32x8_16x32x1_4x4 using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -829,9 +829,9 @@ static void BM_SM50_device_binary_or_binary_and_ssrgemm_nn_t_64x32x8_32x32x1_8x4 using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -879,9 +879,9 @@ static void BM_SM50_device_binary_or_binary_and_ssrgemm_nn_t_64x64x8_32x64x1_8x8 using WarpShape = cutlass::gemm::GemmShape<32, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -929,9 +929,9 @@ static void 
BM_SM50_device_binary_or_binary_and_ssrgemm_nn_t_128x32x8_64x32x1_8x using WarpShape = cutlass::gemm::GemmShape<64, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -979,9 +979,9 @@ static void BM_SM50_device_binary_or_binary_and_ssrgemm_nn_t_16x32x8_8x16x1_2x2_ using WarpShape = cutlass::gemm::GemmShape<8, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1029,9 +1029,9 @@ static void BM_SM50_device_binary_or_binary_and_ssrgemm_nn_t_16x64x8_8x32x1_2x4_ using WarpShape = cutlass::gemm::GemmShape<8, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1079,9 +1079,9 @@ static void 
BM_SM50_device_binary_or_binary_and_ssrgemm_nn_t_32x32x8_16x16x1_4x2 using WarpShape = cutlass::gemm::GemmShape<16, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1129,9 +1129,9 @@ static void BM_SM50_device_binary_or_binary_and_ssrgemm_nn_t_32x64x8_16x32x1_4x4 using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1179,9 +1179,9 @@ static void BM_SM50_device_binary_or_binary_and_ssrgemm_nn_t_32x128x8_16x64x1_4x using WarpShape = cutlass::gemm::GemmShape<16, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1229,9 +1229,9 @@ static void 
BM_SM50_device_binary_or_binary_and_ssrgemm_nn_t_64x32x8_32x16x1_4x4 using WarpShape = cutlass::gemm::GemmShape<32, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1279,9 +1279,9 @@ static void BM_SM50_device_binary_or_binary_and_ssrgemm_nn_t_64x64x8_32x32x1_8x4 using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1329,9 +1329,9 @@ static void BM_SM50_device_binary_or_binary_and_ssrgemm_nn_t_64x128x8_32x64x1_8x using WarpShape = cutlass::gemm::GemmShape<32, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1379,9 +1379,9 @@ static void 
BM_SM50_device_binary_or_binary_and_ssrgemm_nn_t_128x32x8_64x16x1_8x using WarpShape = cutlass::gemm::GemmShape<64, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1429,9 +1429,9 @@ static void BM_SM50_device_binary_or_binary_and_ssrgemm_nn_t_128x64x8_64x32x1_8x using WarpShape = cutlass::gemm::GemmShape<64, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1479,9 +1479,9 @@ static void BM_SM50_device_binary_or_binary_and_ssrgemm_nn_t_16x64x16_8x16x1_2x2 using WarpShape = cutlass::gemm::GemmShape<8, 16, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1529,9 +1529,9 @@ static void 
BM_SM50_device_binary_or_binary_and_ssrgemm_nn_t_16x128x16_8x32x1_2x using WarpShape = cutlass::gemm::GemmShape<8, 32, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1579,9 +1579,9 @@ static void BM_SM50_device_binary_or_binary_and_ssrgemm_nn_t_32x32x8_16x8x1_2x2_ using WarpShape = cutlass::gemm::GemmShape<16, 8, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1629,9 +1629,9 @@ static void BM_SM50_device_binary_or_binary_and_ssrgemm_nn_t_32x64x8_16x16x1_4x2 using WarpShape = cutlass::gemm::GemmShape<16, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1679,9 +1679,9 @@ static void 
BM_SM50_device_binary_or_binary_and_ssrgemm_nn_t_32x128x8_16x32x1_4x using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1729,9 +1729,9 @@ static void BM_SM50_device_binary_or_binary_and_ssrgemm_nn_t_32x256x8_16x64x1_4x using WarpShape = cutlass::gemm::GemmShape<16, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1779,9 +1779,9 @@ static void BM_SM50_device_binary_or_binary_and_ssrgemm_nn_t_64x64x8_32x16x1_4x4 using WarpShape = cutlass::gemm::GemmShape<32, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1829,9 +1829,9 @@ static void 
BM_SM50_device_binary_or_binary_and_ssrgemm_nn_t_64x128x8_32x32x1_8x using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1879,9 +1879,9 @@ static void BM_SM50_device_binary_or_binary_and_ssrgemm_nn_t_64x256x8_32x64x1_8x using WarpShape = cutlass::gemm::GemmShape<32, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1929,9 +1929,9 @@ static void BM_SM50_device_binary_or_binary_and_ssrgemm_nn_t_128x128x8_64x32x1_8 using WarpShape = cutlass::gemm::GemmShape<64, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1979,9 +1979,9 @@ static void 
BM_SM50_device_binary_or_binary_and_ssrgemm_nn_t_32x32x8_8x16x1_2x2_ using WarpShape = cutlass::gemm::GemmShape<8, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -2029,9 +2029,9 @@ static void BM_SM50_device_binary_or_binary_and_ssrgemm_nn_t_64x32x8_16x16x1_4x2 using WarpShape = cutlass::gemm::GemmShape<16, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -2079,9 +2079,9 @@ static void BM_SM50_device_binary_or_binary_and_ssrgemm_nn_t_64x64x8_16x32x1_4x4 using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -2129,9 +2129,9 @@ static void 
BM_SM50_device_binary_or_binary_and_ssrgemm_nn_t_128x32x8_32x16x1_4x using WarpShape = cutlass::gemm::GemmShape<32, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -2179,9 +2179,9 @@ static void BM_SM50_device_binary_or_binary_and_ssrgemm_nn_t_128x64x8_32x32x1_8x using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -2229,9 +2229,9 @@ static void BM_SM50_device_binary_or_binary_and_ssrgemm_nn_t_128x128x8_32x64x1_8 using WarpShape = cutlass::gemm::GemmShape<32, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -2279,9 +2279,9 @@ static void 
BM_SM50_device_binary_or_binary_and_ssrgemm_nn_t_256x32x8_64x16x1_8x using WarpShape = cutlass::gemm::GemmShape<64, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -2329,9 +2329,9 @@ static void BM_SM50_device_binary_or_binary_and_ssrgemm_nn_t_256x64x8_64x32x1_8x using WarpShape = cutlass::gemm::GemmShape<64, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -2379,9 +2379,9 @@ static void BM_SM50_device_binary_or_binary_and_ssrgemm_nn_t_32x64x16_8x16x1_2x2 using WarpShape = cutlass::gemm::GemmShape<8, 16, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -2429,9 +2429,9 @@ static void 
BM_SM50_device_binary_or_binary_and_ssrgemm_nn_t_32x128x16_8x32x1_2x using WarpShape = cutlass::gemm::GemmShape<8, 32, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -2479,9 +2479,9 @@ static void BM_SM50_device_binary_or_binary_and_ssrgemm_nn_t_64x32x16_16x8x1_2x2 using WarpShape = cutlass::gemm::GemmShape<16, 8, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -2529,9 +2529,9 @@ static void BM_SM50_device_binary_or_binary_and_ssrgemm_nn_t_64x64x8_16x16x1_4x2 using WarpShape = cutlass::gemm::GemmShape<16, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -2579,9 +2579,9 @@ static void 
BM_SM50_device_binary_or_binary_and_ssrgemm_nn_t_64x128x8_16x32x1_4x using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -2629,9 +2629,9 @@ static void BM_SM50_device_binary_or_binary_and_ssrgemm_nn_t_64x256x8_16x64x1_4x using WarpShape = cutlass::gemm::GemmShape<16, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -2679,9 +2679,9 @@ static void BM_SM50_device_binary_or_binary_and_ssrgemm_nn_t_128x32x16_32x8x1_4x using WarpShape = cutlass::gemm::GemmShape<32, 8, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -2729,9 +2729,9 @@ static void 
BM_SM50_device_binary_or_binary_and_ssrgemm_nn_t_128x64x8_32x16x1_4x using WarpShape = cutlass::gemm::GemmShape<32, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -2779,9 +2779,9 @@ static void BM_SM50_device_binary_or_binary_and_ssrgemm_nn_t_128x128x8_32x32x1_8 using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -2829,9 +2829,9 @@ static void BM_SM50_device_binary_or_binary_and_ssrgemm_nn_t_256x64x8_64x16x1_8x using WarpShape = cutlass::gemm::GemmShape<64, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; diff --git 
a/bench/device/sm50_simt_binary_or_binary_and_ssrgemm_nt_n.cu b/bench/device/sm50_simt_binary_or_binary_and_ssrgemm_nt_n.cu index e2b3ec8..b18a078 100644 --- a/bench/device/sm50_simt_binary_or_binary_and_ssrgemm_nt_n.cu +++ b/bench/device/sm50_simt_binary_or_binary_and_ssrgemm_nt_n.cu @@ -29,9 +29,9 @@ static void BM_SM50_device_binary_or_binary_and_ssrgemm_nt_n_8x32x8_8x32x1_2x4_4 using WarpShape = cutlass::gemm::GemmShape<8, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -79,9 +79,9 @@ static void BM_SM50_device_binary_or_binary_and_ssrgemm_nt_n_16x32x8_16x32x1_4x4 using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -129,9 +129,9 @@ static void BM_SM50_device_binary_or_binary_and_ssrgemm_nt_n_16x64x8_16x64x1_4x8 using WarpShape = cutlass::gemm::GemmShape<16, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + 
using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -179,9 +179,9 @@ static void BM_SM50_device_binary_or_binary_and_ssrgemm_nt_n_32x32x8_32x32x1_8x4 using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -229,9 +229,9 @@ static void BM_SM50_device_binary_or_binary_and_ssrgemm_nt_n_32x64x8_32x64x1_8x8 using WarpShape = cutlass::gemm::GemmShape<32, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -279,9 +279,9 @@ static void BM_SM50_device_binary_or_binary_and_ssrgemm_nt_n_64x32x8_64x32x1_8x8 using WarpShape = cutlass::gemm::GemmShape<64, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename 
cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -329,9 +329,9 @@ static void BM_SM50_device_binary_or_binary_and_ssrgemm_nt_n_8x32x8_8x16x1_2x2_4 using WarpShape = cutlass::gemm::GemmShape<8, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -379,9 +379,9 @@ static void BM_SM50_device_binary_or_binary_and_ssrgemm_nt_n_8x64x8_8x32x1_2x4_4 using WarpShape = cutlass::gemm::GemmShape<8, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -429,9 +429,9 @@ static void BM_SM50_device_binary_or_binary_and_ssrgemm_nt_n_16x32x8_16x16x1_4x2 using WarpShape = cutlass::gemm::GemmShape<16, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename 
cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -479,9 +479,9 @@ static void BM_SM50_device_binary_or_binary_and_ssrgemm_nt_n_16x64x8_16x32x1_4x4 using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -529,9 +529,9 @@ static void BM_SM50_device_binary_or_binary_and_ssrgemm_nt_n_16x128x8_16x64x1_4x using WarpShape = cutlass::gemm::GemmShape<16, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -579,9 +579,9 @@ static void BM_SM50_device_binary_or_binary_and_ssrgemm_nt_n_32x32x8_32x16x1_4x4 using WarpShape = cutlass::gemm::GemmShape<32, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename 
cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -629,9 +629,9 @@ static void BM_SM50_device_binary_or_binary_and_ssrgemm_nt_n_32x64x8_32x32x1_8x4 using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -679,9 +679,9 @@ static void BM_SM50_device_binary_or_binary_and_ssrgemm_nt_n_32x128x8_32x64x1_8x using WarpShape = cutlass::gemm::GemmShape<32, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -729,9 +729,9 @@ static void BM_SM50_device_binary_or_binary_and_ssrgemm_nt_n_64x64x8_64x32x1_8x8 using WarpShape = cutlass::gemm::GemmShape<64, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename 
cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -779,9 +779,9 @@ static void BM_SM50_device_binary_or_binary_and_ssrgemm_nt_n_32x32x8_16x32x1_4x4 using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -829,9 +829,9 @@ static void BM_SM50_device_binary_or_binary_and_ssrgemm_nt_n_64x32x8_32x32x1_8x4 using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -879,9 +879,9 @@ static void BM_SM50_device_binary_or_binary_and_ssrgemm_nt_n_64x64x8_32x64x1_8x8 using WarpShape = cutlass::gemm::GemmShape<32, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename 
cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -929,9 +929,9 @@ static void BM_SM50_device_binary_or_binary_and_ssrgemm_nt_n_128x32x8_64x32x1_8x using WarpShape = cutlass::gemm::GemmShape<64, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -979,9 +979,9 @@ static void BM_SM50_device_binary_or_binary_and_ssrgemm_nt_n_16x32x8_8x16x1_2x2_ using WarpShape = cutlass::gemm::GemmShape<8, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1029,9 +1029,9 @@ static void BM_SM50_device_binary_or_binary_and_ssrgemm_nt_n_16x64x8_8x32x1_2x4_ using WarpShape = cutlass::gemm::GemmShape<8, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename 
cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1079,9 +1079,9 @@ static void BM_SM50_device_binary_or_binary_and_ssrgemm_nt_n_32x32x8_16x16x1_4x2 using WarpShape = cutlass::gemm::GemmShape<16, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1129,9 +1129,9 @@ static void BM_SM50_device_binary_or_binary_and_ssrgemm_nt_n_32x64x8_16x32x1_4x4 using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1179,9 +1179,9 @@ static void BM_SM50_device_binary_or_binary_and_ssrgemm_nt_n_32x128x8_16x64x1_4x using WarpShape = cutlass::gemm::GemmShape<16, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename 
cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1229,9 +1229,9 @@ static void BM_SM50_device_binary_or_binary_and_ssrgemm_nt_n_64x32x8_32x16x1_4x4 using WarpShape = cutlass::gemm::GemmShape<32, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1279,9 +1279,9 @@ static void BM_SM50_device_binary_or_binary_and_ssrgemm_nt_n_64x64x8_32x32x1_8x4 using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1329,9 +1329,9 @@ static void BM_SM50_device_binary_or_binary_and_ssrgemm_nt_n_64x128x8_32x64x1_8x using WarpShape = cutlass::gemm::GemmShape<32, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename 
cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1379,9 +1379,9 @@ static void BM_SM50_device_binary_or_binary_and_ssrgemm_nt_n_128x32x8_64x16x1_8x using WarpShape = cutlass::gemm::GemmShape<64, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1429,9 +1429,9 @@ static void BM_SM50_device_binary_or_binary_and_ssrgemm_nt_n_128x64x8_64x32x1_8x using WarpShape = cutlass::gemm::GemmShape<64, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1479,9 +1479,9 @@ static void BM_SM50_device_binary_or_binary_and_ssrgemm_nt_n_16x64x16_8x16x1_2x2 using WarpShape = cutlass::gemm::GemmShape<8, 16, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename 
cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1529,9 +1529,9 @@ static void BM_SM50_device_binary_or_binary_and_ssrgemm_nt_n_16x128x16_8x32x1_2x using WarpShape = cutlass::gemm::GemmShape<8, 32, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1579,9 +1579,9 @@ static void BM_SM50_device_binary_or_binary_and_ssrgemm_nt_n_32x32x8_16x8x1_2x2_ using WarpShape = cutlass::gemm::GemmShape<16, 8, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1629,9 +1629,9 @@ static void BM_SM50_device_binary_or_binary_and_ssrgemm_nt_n_32x64x8_16x16x1_4x2 using WarpShape = cutlass::gemm::GemmShape<16, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename 
cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1679,9 +1679,9 @@ static void BM_SM50_device_binary_or_binary_and_ssrgemm_nt_n_32x128x8_16x32x1_4x using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1729,9 +1729,9 @@ static void BM_SM50_device_binary_or_binary_and_ssrgemm_nt_n_32x256x8_16x64x1_4x using WarpShape = cutlass::gemm::GemmShape<16, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1779,9 +1779,9 @@ static void BM_SM50_device_binary_or_binary_and_ssrgemm_nt_n_64x64x8_32x16x1_4x4 using WarpShape = cutlass::gemm::GemmShape<32, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename 
cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1829,9 +1829,9 @@ static void BM_SM50_device_binary_or_binary_and_ssrgemm_nt_n_64x128x8_32x32x1_8x using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1879,9 +1879,9 @@ static void BM_SM50_device_binary_or_binary_and_ssrgemm_nt_n_64x256x8_32x64x1_8x using WarpShape = cutlass::gemm::GemmShape<32, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1929,9 +1929,9 @@ static void BM_SM50_device_binary_or_binary_and_ssrgemm_nt_n_128x128x8_64x32x1_8 using WarpShape = cutlass::gemm::GemmShape<64, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename 
cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1979,9 +1979,9 @@ static void BM_SM50_device_binary_or_binary_and_ssrgemm_nt_n_32x32x8_8x16x1_2x2_ using WarpShape = cutlass::gemm::GemmShape<8, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -2029,9 +2029,9 @@ static void BM_SM50_device_binary_or_binary_and_ssrgemm_nt_n_64x32x8_16x16x1_4x2 using WarpShape = cutlass::gemm::GemmShape<16, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -2079,9 +2079,9 @@ static void BM_SM50_device_binary_or_binary_and_ssrgemm_nt_n_64x64x8_16x32x1_4x4 using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename 
cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -2129,9 +2129,9 @@ static void BM_SM50_device_binary_or_binary_and_ssrgemm_nt_n_128x32x8_32x16x1_4x using WarpShape = cutlass::gemm::GemmShape<32, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -2179,9 +2179,9 @@ static void BM_SM50_device_binary_or_binary_and_ssrgemm_nt_n_128x64x8_32x32x1_8x using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -2229,9 +2229,9 @@ static void BM_SM50_device_binary_or_binary_and_ssrgemm_nt_n_128x128x8_32x64x1_8 using WarpShape = cutlass::gemm::GemmShape<32, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename 
cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -2279,9 +2279,9 @@ static void BM_SM50_device_binary_or_binary_and_ssrgemm_nt_n_256x32x8_64x16x1_8x using WarpShape = cutlass::gemm::GemmShape<64, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -2329,9 +2329,9 @@ static void BM_SM50_device_binary_or_binary_and_ssrgemm_nt_n_256x64x8_64x32x1_8x using WarpShape = cutlass::gemm::GemmShape<64, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -2379,9 +2379,9 @@ static void BM_SM50_device_binary_or_binary_and_ssrgemm_nt_n_32x64x16_8x16x1_2x2 using WarpShape = cutlass::gemm::GemmShape<8, 16, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename 
cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -2429,9 +2429,9 @@ static void BM_SM50_device_binary_or_binary_and_ssrgemm_nt_n_32x128x16_8x32x1_2x using WarpShape = cutlass::gemm::GemmShape<8, 32, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -2479,9 +2479,9 @@ static void BM_SM50_device_binary_or_binary_and_ssrgemm_nt_n_64x32x16_16x8x1_2x2 using WarpShape = cutlass::gemm::GemmShape<16, 8, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -2529,9 +2529,9 @@ static void BM_SM50_device_binary_or_binary_and_ssrgemm_nt_n_64x64x8_16x16x1_4x2 using WarpShape = cutlass::gemm::GemmShape<16, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename 
cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -2579,9 +2579,9 @@ static void BM_SM50_device_binary_or_binary_and_ssrgemm_nt_n_64x128x8_16x32x1_4x using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -2629,9 +2629,9 @@ static void BM_SM50_device_binary_or_binary_and_ssrgemm_nt_n_64x256x8_16x64x1_4x using WarpShape = cutlass::gemm::GemmShape<16, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -2679,9 +2679,9 @@ static void BM_SM50_device_binary_or_binary_and_ssrgemm_nt_n_128x32x16_32x8x1_4x using WarpShape = cutlass::gemm::GemmShape<32, 8, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename 
cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -2729,9 +2729,9 @@ static void BM_SM50_device_binary_or_binary_and_ssrgemm_nt_n_128x64x8_32x16x1_4x using WarpShape = cutlass::gemm::GemmShape<32, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -2779,9 +2779,9 @@ static void BM_SM50_device_binary_or_binary_and_ssrgemm_nt_n_128x128x8_32x32x1_8 using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -2829,9 +2829,9 @@ static void BM_SM50_device_binary_or_binary_and_ssrgemm_nt_n_256x64x8_64x16x1_8x using WarpShape = cutlass::gemm::GemmShape<64, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename 
cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; diff --git a/bench/device/sm50_simt_binary_or_binary_and_ssrgemm_nt_t.cu b/bench/device/sm50_simt_binary_or_binary_and_ssrgemm_nt_t.cu index 4a24d59..dc57afd 100644 --- a/bench/device/sm50_simt_binary_or_binary_and_ssrgemm_nt_t.cu +++ b/bench/device/sm50_simt_binary_or_binary_and_ssrgemm_nt_t.cu @@ -29,9 +29,9 @@ static void BM_SM50_device_binary_or_binary_and_ssrgemm_nt_t_8x32x8_8x32x1_2x4_4 using WarpShape = cutlass::gemm::GemmShape<8, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -79,9 +79,9 @@ static void BM_SM50_device_binary_or_binary_and_ssrgemm_nt_t_16x32x8_16x32x1_4x4 using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -129,9 +129,9 @@ static void BM_SM50_device_binary_or_binary_and_ssrgemm_nt_t_16x64x8_16x64x1_4x8 using WarpShape = cutlass::gemm::GemmShape<16, 64, 8>; using 
InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -179,9 +179,9 @@ static void BM_SM50_device_binary_or_binary_and_ssrgemm_nt_t_32x32x8_32x32x1_8x4 using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -229,9 +229,9 @@ static void BM_SM50_device_binary_or_binary_and_ssrgemm_nt_t_32x64x8_32x64x1_8x8 using WarpShape = cutlass::gemm::GemmShape<32, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -279,9 +279,9 @@ static void BM_SM50_device_binary_or_binary_and_ssrgemm_nt_t_64x32x8_64x32x1_8x8 using WarpShape = cutlass::gemm::GemmShape<64, 32, 8>; using InstructionShape = 
cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -329,9 +329,9 @@ static void BM_SM50_device_binary_or_binary_and_ssrgemm_nt_t_8x32x8_8x16x1_2x2_4 using WarpShape = cutlass::gemm::GemmShape<8, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -379,9 +379,9 @@ static void BM_SM50_device_binary_or_binary_and_ssrgemm_nt_t_8x64x8_8x32x1_2x4_4 using WarpShape = cutlass::gemm::GemmShape<8, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -429,9 +429,9 @@ static void BM_SM50_device_binary_or_binary_and_ssrgemm_nt_t_16x32x8_16x16x1_4x2 using WarpShape = cutlass::gemm::GemmShape<16, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 
1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -479,9 +479,9 @@ static void BM_SM50_device_binary_or_binary_and_ssrgemm_nt_t_16x64x8_16x32x1_4x4 using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -529,9 +529,9 @@ static void BM_SM50_device_binary_or_binary_and_ssrgemm_nt_t_16x128x8_16x64x1_4x using WarpShape = cutlass::gemm::GemmShape<16, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -579,9 +579,9 @@ static void BM_SM50_device_binary_or_binary_and_ssrgemm_nt_t_32x32x8_32x16x1_4x4 using WarpShape = cutlass::gemm::GemmShape<32, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = 
typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -629,9 +629,9 @@ static void BM_SM50_device_binary_or_binary_and_ssrgemm_nt_t_32x64x8_32x32x1_8x4 using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -679,9 +679,9 @@ static void BM_SM50_device_binary_or_binary_and_ssrgemm_nt_t_32x128x8_32x64x1_8x using WarpShape = cutlass::gemm::GemmShape<32, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -729,9 +729,9 @@ static void BM_SM50_device_binary_or_binary_and_ssrgemm_nt_t_64x64x8_64x32x1_8x8 using WarpShape = cutlass::gemm::GemmShape<64, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename 
cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -779,9 +779,9 @@ static void BM_SM50_device_binary_or_binary_and_ssrgemm_nt_t_32x32x8_16x32x1_4x4 using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -829,9 +829,9 @@ static void BM_SM50_device_binary_or_binary_and_ssrgemm_nt_t_64x32x8_32x32x1_8x4 using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -879,9 +879,9 @@ static void BM_SM50_device_binary_or_binary_and_ssrgemm_nt_t_64x64x8_32x64x1_8x8 using WarpShape = cutlass::gemm::GemmShape<32, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename 
cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -929,9 +929,9 @@ static void BM_SM50_device_binary_or_binary_and_ssrgemm_nt_t_128x32x8_64x32x1_8x using WarpShape = cutlass::gemm::GemmShape<64, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -979,9 +979,9 @@ static void BM_SM50_device_binary_or_binary_and_ssrgemm_nt_t_16x32x8_8x16x1_2x2_ using WarpShape = cutlass::gemm::GemmShape<8, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1029,9 +1029,9 @@ static void BM_SM50_device_binary_or_binary_and_ssrgemm_nt_t_16x64x8_8x32x1_2x4_ using WarpShape = cutlass::gemm::GemmShape<8, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename 
cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1079,9 +1079,9 @@ static void BM_SM50_device_binary_or_binary_and_ssrgemm_nt_t_32x32x8_16x16x1_4x2 using WarpShape = cutlass::gemm::GemmShape<16, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1129,9 +1129,9 @@ static void BM_SM50_device_binary_or_binary_and_ssrgemm_nt_t_32x64x8_16x32x1_4x4 using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1179,9 +1179,9 @@ static void BM_SM50_device_binary_or_binary_and_ssrgemm_nt_t_32x128x8_16x64x1_4x using WarpShape = cutlass::gemm::GemmShape<16, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename 
cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1229,9 +1229,9 @@ static void BM_SM50_device_binary_or_binary_and_ssrgemm_nt_t_64x32x8_32x16x1_4x4 using WarpShape = cutlass::gemm::GemmShape<32, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1279,9 +1279,9 @@ static void BM_SM50_device_binary_or_binary_and_ssrgemm_nt_t_64x64x8_32x32x1_8x4 using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1329,9 +1329,9 @@ static void BM_SM50_device_binary_or_binary_and_ssrgemm_nt_t_64x128x8_32x64x1_8x using WarpShape = cutlass::gemm::GemmShape<32, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename 
cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1379,9 +1379,9 @@ static void BM_SM50_device_binary_or_binary_and_ssrgemm_nt_t_128x32x8_64x16x1_8x using WarpShape = cutlass::gemm::GemmShape<64, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1429,9 +1429,9 @@ static void BM_SM50_device_binary_or_binary_and_ssrgemm_nt_t_128x64x8_64x32x1_8x using WarpShape = cutlass::gemm::GemmShape<64, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1479,9 +1479,9 @@ static void BM_SM50_device_binary_or_binary_and_ssrgemm_nt_t_16x64x16_8x16x1_2x2 using WarpShape = cutlass::gemm::GemmShape<8, 16, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename 
cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1529,9 +1529,9 @@ static void BM_SM50_device_binary_or_binary_and_ssrgemm_nt_t_16x128x16_8x32x1_2x using WarpShape = cutlass::gemm::GemmShape<8, 32, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1579,9 +1579,9 @@ static void BM_SM50_device_binary_or_binary_and_ssrgemm_nt_t_32x32x8_16x8x1_2x2_ using WarpShape = cutlass::gemm::GemmShape<16, 8, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1629,9 +1629,9 @@ static void BM_SM50_device_binary_or_binary_and_ssrgemm_nt_t_32x64x8_16x16x1_4x2 using WarpShape = cutlass::gemm::GemmShape<16, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename 
cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1679,9 +1679,9 @@ static void BM_SM50_device_binary_or_binary_and_ssrgemm_nt_t_32x128x8_16x32x1_4x using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1729,9 +1729,9 @@ static void BM_SM50_device_binary_or_binary_and_ssrgemm_nt_t_32x256x8_16x64x1_4x using WarpShape = cutlass::gemm::GemmShape<16, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1779,9 +1779,9 @@ static void BM_SM50_device_binary_or_binary_and_ssrgemm_nt_t_64x64x8_32x16x1_4x4 using WarpShape = cutlass::gemm::GemmShape<32, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename 
cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1829,9 +1829,9 @@ static void BM_SM50_device_binary_or_binary_and_ssrgemm_nt_t_64x128x8_32x32x1_8x using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1879,9 +1879,9 @@ static void BM_SM50_device_binary_or_binary_and_ssrgemm_nt_t_64x256x8_32x64x1_8x using WarpShape = cutlass::gemm::GemmShape<32, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1929,9 +1929,9 @@ static void BM_SM50_device_binary_or_binary_and_ssrgemm_nt_t_128x128x8_64x32x1_8 using WarpShape = cutlass::gemm::GemmShape<64, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename 
cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1979,9 +1979,9 @@ static void BM_SM50_device_binary_or_binary_and_ssrgemm_nt_t_32x32x8_8x16x1_2x2_ using WarpShape = cutlass::gemm::GemmShape<8, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -2029,9 +2029,9 @@ static void BM_SM50_device_binary_or_binary_and_ssrgemm_nt_t_64x32x8_16x16x1_4x2 using WarpShape = cutlass::gemm::GemmShape<16, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -2079,9 +2079,9 @@ static void BM_SM50_device_binary_or_binary_and_ssrgemm_nt_t_64x64x8_16x32x1_4x4 using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename 
cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -2129,9 +2129,9 @@ static void BM_SM50_device_binary_or_binary_and_ssrgemm_nt_t_128x32x8_32x16x1_4x using WarpShape = cutlass::gemm::GemmShape<32, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -2179,9 +2179,9 @@ static void BM_SM50_device_binary_or_binary_and_ssrgemm_nt_t_128x64x8_32x32x1_8x using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -2229,9 +2229,9 @@ static void BM_SM50_device_binary_or_binary_and_ssrgemm_nt_t_128x128x8_32x64x1_8 using WarpShape = cutlass::gemm::GemmShape<32, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename 
cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -2279,9 +2279,9 @@ static void BM_SM50_device_binary_or_binary_and_ssrgemm_nt_t_256x32x8_64x16x1_8x using WarpShape = cutlass::gemm::GemmShape<64, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -2329,9 +2329,9 @@ static void BM_SM50_device_binary_or_binary_and_ssrgemm_nt_t_256x64x8_64x32x1_8x using WarpShape = cutlass::gemm::GemmShape<64, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -2379,9 +2379,9 @@ static void BM_SM50_device_binary_or_binary_and_ssrgemm_nt_t_32x64x16_8x16x1_2x2 using WarpShape = cutlass::gemm::GemmShape<8, 16, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename 
cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -2429,9 +2429,9 @@ static void BM_SM50_device_binary_or_binary_and_ssrgemm_nt_t_32x128x16_8x32x1_2x using WarpShape = cutlass::gemm::GemmShape<8, 32, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -2479,9 +2479,9 @@ static void BM_SM50_device_binary_or_binary_and_ssrgemm_nt_t_64x32x16_16x8x1_2x2 using WarpShape = cutlass::gemm::GemmShape<16, 8, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -2529,9 +2529,9 @@ static void BM_SM50_device_binary_or_binary_and_ssrgemm_nt_t_64x64x8_16x16x1_4x2 using WarpShape = cutlass::gemm::GemmShape<16, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename 
cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -2579,9 +2579,9 @@ static void BM_SM50_device_binary_or_binary_and_ssrgemm_nt_t_64x128x8_16x32x1_4x using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -2629,9 +2629,9 @@ static void BM_SM50_device_binary_or_binary_and_ssrgemm_nt_t_64x256x8_16x64x1_4x using WarpShape = cutlass::gemm::GemmShape<16, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -2679,9 +2679,9 @@ static void BM_SM50_device_binary_or_binary_and_ssrgemm_nt_t_128x32x16_32x8x1_4x using WarpShape = cutlass::gemm::GemmShape<32, 8, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename 
cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -2729,9 +2729,9 @@ static void BM_SM50_device_binary_or_binary_and_ssrgemm_nt_t_128x64x8_32x16x1_4x using WarpShape = cutlass::gemm::GemmShape<32, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -2779,9 +2779,9 @@ static void BM_SM50_device_binary_or_binary_and_ssrgemm_nt_t_128x128x8_32x32x1_8 using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -2829,9 +2829,9 @@ static void BM_SM50_device_binary_or_binary_and_ssrgemm_nt_t_256x64x8_64x16x1_8x using WarpShape = cutlass::gemm::GemmShape<64, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename 
cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; diff --git a/bench/device/sm50_simt_binary_or_binary_and_ssrgemm_tn_n.cu b/bench/device/sm50_simt_binary_or_binary_and_ssrgemm_tn_n.cu index 7cf2777..1186fa3 100644 --- a/bench/device/sm50_simt_binary_or_binary_and_ssrgemm_tn_n.cu +++ b/bench/device/sm50_simt_binary_or_binary_and_ssrgemm_tn_n.cu @@ -29,9 +29,9 @@ static void BM_SM50_device_binary_or_binary_and_ssrgemm_tn_n_8x32x8_8x32x1_2x4_4 using WarpShape = cutlass::gemm::GemmShape<8, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -79,9 +79,9 @@ static void BM_SM50_device_binary_or_binary_and_ssrgemm_tn_n_16x32x8_16x32x1_4x4 using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = 
Config::MultiplicationOp; @@ -129,9 +129,9 @@ static void BM_SM50_device_binary_or_binary_and_ssrgemm_tn_n_16x64x8_16x64x1_4x8 using WarpShape = cutlass::gemm::GemmShape<16, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -179,9 +179,9 @@ static void BM_SM50_device_binary_or_binary_and_ssrgemm_tn_n_32x32x8_32x32x1_8x4 using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -229,9 +229,9 @@ static void BM_SM50_device_binary_or_binary_and_ssrgemm_tn_n_32x64x8_32x64x1_8x8 using WarpShape = cutlass::gemm::GemmShape<32, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ 
-279,9 +279,9 @@ static void BM_SM50_device_binary_or_binary_and_ssrgemm_tn_n_64x32x8_64x32x1_8x8 using WarpShape = cutlass::gemm::GemmShape<64, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -329,9 +329,9 @@ static void BM_SM50_device_binary_or_binary_and_ssrgemm_tn_n_8x32x8_8x16x1_2x2_4 using WarpShape = cutlass::gemm::GemmShape<8, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -379,9 +379,9 @@ static void BM_SM50_device_binary_or_binary_and_ssrgemm_tn_n_8x64x8_8x32x1_2x4_4 using WarpShape = cutlass::gemm::GemmShape<8, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -429,9 +429,9 @@ static void 
BM_SM50_device_binary_or_binary_and_ssrgemm_tn_n_16x32x8_16x16x1_4x2 using WarpShape = cutlass::gemm::GemmShape<16, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -479,9 +479,9 @@ static void BM_SM50_device_binary_or_binary_and_ssrgemm_tn_n_16x64x8_16x32x1_4x4 using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -529,9 +529,9 @@ static void BM_SM50_device_binary_or_binary_and_ssrgemm_tn_n_16x128x8_16x64x1_4x using WarpShape = cutlass::gemm::GemmShape<16, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -579,9 +579,9 @@ static void 
BM_SM50_device_binary_or_binary_and_ssrgemm_tn_n_32x32x8_32x16x1_4x4 using WarpShape = cutlass::gemm::GemmShape<32, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -629,9 +629,9 @@ static void BM_SM50_device_binary_or_binary_and_ssrgemm_tn_n_32x64x8_32x32x1_8x4 using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -679,9 +679,9 @@ static void BM_SM50_device_binary_or_binary_and_ssrgemm_tn_n_32x128x8_32x64x1_8x using WarpShape = cutlass::gemm::GemmShape<32, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -729,9 +729,9 @@ static void 
BM_SM50_device_binary_or_binary_and_ssrgemm_tn_n_64x64x8_64x32x1_8x8 using WarpShape = cutlass::gemm::GemmShape<64, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -779,9 +779,9 @@ static void BM_SM50_device_binary_or_binary_and_ssrgemm_tn_n_32x32x8_16x32x1_4x4 using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -829,9 +829,9 @@ static void BM_SM50_device_binary_or_binary_and_ssrgemm_tn_n_64x32x8_32x32x1_8x4 using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -879,9 +879,9 @@ static void 
BM_SM50_device_binary_or_binary_and_ssrgemm_tn_n_64x64x8_32x64x1_8x8 using WarpShape = cutlass::gemm::GemmShape<32, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -929,9 +929,9 @@ static void BM_SM50_device_binary_or_binary_and_ssrgemm_tn_n_128x32x8_64x32x1_8x using WarpShape = cutlass::gemm::GemmShape<64, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -979,9 +979,9 @@ static void BM_SM50_device_binary_or_binary_and_ssrgemm_tn_n_16x32x8_8x16x1_2x2_ using WarpShape = cutlass::gemm::GemmShape<8, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1029,9 +1029,9 @@ static void 
BM_SM50_device_binary_or_binary_and_ssrgemm_tn_n_16x64x8_8x32x1_2x4_ using WarpShape = cutlass::gemm::GemmShape<8, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1079,9 +1079,9 @@ static void BM_SM50_device_binary_or_binary_and_ssrgemm_tn_n_32x32x8_16x16x1_4x2 using WarpShape = cutlass::gemm::GemmShape<16, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1129,9 +1129,9 @@ static void BM_SM50_device_binary_or_binary_and_ssrgemm_tn_n_32x64x8_16x32x1_4x4 using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1179,9 +1179,9 @@ static void 
BM_SM50_device_binary_or_binary_and_ssrgemm_tn_n_32x128x8_16x64x1_4x using WarpShape = cutlass::gemm::GemmShape<16, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1229,9 +1229,9 @@ static void BM_SM50_device_binary_or_binary_and_ssrgemm_tn_n_64x32x8_32x16x1_4x4 using WarpShape = cutlass::gemm::GemmShape<32, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1279,9 +1279,9 @@ static void BM_SM50_device_binary_or_binary_and_ssrgemm_tn_n_64x64x8_32x32x1_8x4 using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1329,9 +1329,9 @@ static void 
BM_SM50_device_binary_or_binary_and_ssrgemm_tn_n_64x128x8_32x64x1_8x using WarpShape = cutlass::gemm::GemmShape<32, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1379,9 +1379,9 @@ static void BM_SM50_device_binary_or_binary_and_ssrgemm_tn_n_128x32x8_64x16x1_8x using WarpShape = cutlass::gemm::GemmShape<64, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1429,9 +1429,9 @@ static void BM_SM50_device_binary_or_binary_and_ssrgemm_tn_n_128x64x8_64x32x1_8x using WarpShape = cutlass::gemm::GemmShape<64, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1479,9 +1479,9 @@ static void 
BM_SM50_device_binary_or_binary_and_ssrgemm_tn_n_16x64x16_8x16x1_2x2 using WarpShape = cutlass::gemm::GemmShape<8, 16, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1529,9 +1529,9 @@ static void BM_SM50_device_binary_or_binary_and_ssrgemm_tn_n_16x128x16_8x32x1_2x using WarpShape = cutlass::gemm::GemmShape<8, 32, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1579,9 +1579,9 @@ static void BM_SM50_device_binary_or_binary_and_ssrgemm_tn_n_32x32x8_16x8x1_2x2_ using WarpShape = cutlass::gemm::GemmShape<16, 8, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1629,9 +1629,9 @@ static void 
BM_SM50_device_binary_or_binary_and_ssrgemm_tn_n_32x64x8_16x16x1_4x2 using WarpShape = cutlass::gemm::GemmShape<16, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1679,9 +1679,9 @@ static void BM_SM50_device_binary_or_binary_and_ssrgemm_tn_n_32x128x8_16x32x1_4x using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1729,9 +1729,9 @@ static void BM_SM50_device_binary_or_binary_and_ssrgemm_tn_n_32x256x8_16x64x1_4x using WarpShape = cutlass::gemm::GemmShape<16, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1779,9 +1779,9 @@ static void 
BM_SM50_device_binary_or_binary_and_ssrgemm_tn_n_64x64x8_32x16x1_4x4 using WarpShape = cutlass::gemm::GemmShape<32, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1829,9 +1829,9 @@ static void BM_SM50_device_binary_or_binary_and_ssrgemm_tn_n_64x128x8_32x32x1_8x using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1879,9 +1879,9 @@ static void BM_SM50_device_binary_or_binary_and_ssrgemm_tn_n_64x256x8_32x64x1_8x using WarpShape = cutlass::gemm::GemmShape<32, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1929,9 +1929,9 @@ static void 
BM_SM50_device_binary_or_binary_and_ssrgemm_tn_n_128x128x8_64x32x1_8 using WarpShape = cutlass::gemm::GemmShape<64, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1979,9 +1979,9 @@ static void BM_SM50_device_binary_or_binary_and_ssrgemm_tn_n_32x32x8_8x16x1_2x2_ using WarpShape = cutlass::gemm::GemmShape<8, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -2029,9 +2029,9 @@ static void BM_SM50_device_binary_or_binary_and_ssrgemm_tn_n_64x32x8_16x16x1_4x2 using WarpShape = cutlass::gemm::GemmShape<16, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -2079,9 +2079,9 @@ static void 
BM_SM50_device_binary_or_binary_and_ssrgemm_tn_n_64x64x8_16x32x1_4x4 using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -2129,9 +2129,9 @@ static void BM_SM50_device_binary_or_binary_and_ssrgemm_tn_n_128x32x8_32x16x1_4x using WarpShape = cutlass::gemm::GemmShape<32, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -2179,9 +2179,9 @@ static void BM_SM50_device_binary_or_binary_and_ssrgemm_tn_n_128x64x8_32x32x1_8x using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -2229,9 +2229,9 @@ static void 
BM_SM50_device_binary_or_binary_and_ssrgemm_tn_n_128x128x8_32x64x1_8 using WarpShape = cutlass::gemm::GemmShape<32, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -2279,9 +2279,9 @@ static void BM_SM50_device_binary_or_binary_and_ssrgemm_tn_n_256x32x8_64x16x1_8x using WarpShape = cutlass::gemm::GemmShape<64, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -2329,9 +2329,9 @@ static void BM_SM50_device_binary_or_binary_and_ssrgemm_tn_n_256x64x8_64x32x1_8x using WarpShape = cutlass::gemm::GemmShape<64, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -2379,9 +2379,9 @@ static void 
BM_SM50_device_binary_or_binary_and_ssrgemm_tn_n_32x64x16_8x16x1_2x2 using WarpShape = cutlass::gemm::GemmShape<8, 16, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -2429,9 +2429,9 @@ static void BM_SM50_device_binary_or_binary_and_ssrgemm_tn_n_32x128x16_8x32x1_2x using WarpShape = cutlass::gemm::GemmShape<8, 32, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -2479,9 +2479,9 @@ static void BM_SM50_device_binary_or_binary_and_ssrgemm_tn_n_64x32x16_16x8x1_2x2 using WarpShape = cutlass::gemm::GemmShape<16, 8, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -2529,9 +2529,9 @@ static void 
BM_SM50_device_binary_or_binary_and_ssrgemm_tn_n_64x64x8_16x16x1_4x2 using WarpShape = cutlass::gemm::GemmShape<16, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -2579,9 +2579,9 @@ static void BM_SM50_device_binary_or_binary_and_ssrgemm_tn_n_64x128x8_16x32x1_4x using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -2629,9 +2629,9 @@ static void BM_SM50_device_binary_or_binary_and_ssrgemm_tn_n_64x256x8_16x64x1_4x using WarpShape = cutlass::gemm::GemmShape<16, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -2679,9 +2679,9 @@ static void 
BM_SM50_device_binary_or_binary_and_ssrgemm_tn_n_128x32x16_32x8x1_4x using WarpShape = cutlass::gemm::GemmShape<32, 8, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -2729,9 +2729,9 @@ static void BM_SM50_device_binary_or_binary_and_ssrgemm_tn_n_128x64x8_32x16x1_4x using WarpShape = cutlass::gemm::GemmShape<32, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -2779,9 +2779,9 @@ static void BM_SM50_device_binary_or_binary_and_ssrgemm_tn_n_128x128x8_32x32x1_8 using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -2829,9 +2829,9 @@ static void 
BM_SM50_device_binary_or_binary_and_ssrgemm_tn_n_256x64x8_64x16x1_8x using WarpShape = cutlass::gemm::GemmShape<64, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; diff --git a/bench/device/sm50_simt_binary_or_binary_and_ssrgemm_tn_t.cu b/bench/device/sm50_simt_binary_or_binary_and_ssrgemm_tn_t.cu index e98898d..1d8f269 100644 --- a/bench/device/sm50_simt_binary_or_binary_and_ssrgemm_tn_t.cu +++ b/bench/device/sm50_simt_binary_or_binary_and_ssrgemm_tn_t.cu @@ -29,9 +29,9 @@ static void BM_SM50_device_binary_or_binary_and_ssrgemm_tn_t_8x32x8_8x32x1_2x4_4 using WarpShape = cutlass::gemm::GemmShape<8, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -79,9 +79,9 @@ static void BM_SM50_device_binary_or_binary_and_ssrgemm_tn_t_16x32x8_16x32x1_4x4 using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = 
typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -129,9 +129,9 @@ static void BM_SM50_device_binary_or_binary_and_ssrgemm_tn_t_16x64x8_16x64x1_4x8 using WarpShape = cutlass::gemm::GemmShape<16, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -179,9 +179,9 @@ static void BM_SM50_device_binary_or_binary_and_ssrgemm_tn_t_32x32x8_32x32x1_8x4 using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -229,9 +229,9 @@ static void BM_SM50_device_binary_or_binary_and_ssrgemm_tn_t_32x64x8_32x64x1_8x8 using WarpShape = cutlass::gemm::GemmShape<32, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename 
cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -279,9 +279,9 @@ static void BM_SM50_device_binary_or_binary_and_ssrgemm_tn_t_64x32x8_64x32x1_8x8 using WarpShape = cutlass::gemm::GemmShape<64, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -329,9 +329,9 @@ static void BM_SM50_device_binary_or_binary_and_ssrgemm_tn_t_8x32x8_8x16x1_2x2_4 using WarpShape = cutlass::gemm::GemmShape<8, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -379,9 +379,9 @@ static void BM_SM50_device_binary_or_binary_and_ssrgemm_tn_t_8x64x8_8x32x1_2x4_4 using WarpShape = cutlass::gemm::GemmShape<8, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename 
cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -429,9 +429,9 @@ static void BM_SM50_device_binary_or_binary_and_ssrgemm_tn_t_16x32x8_16x16x1_4x2 using WarpShape = cutlass::gemm::GemmShape<16, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -479,9 +479,9 @@ static void BM_SM50_device_binary_or_binary_and_ssrgemm_tn_t_16x64x8_16x32x1_4x4 using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -529,9 +529,9 @@ static void BM_SM50_device_binary_or_binary_and_ssrgemm_tn_t_16x128x8_16x64x1_4x using WarpShape = cutlass::gemm::GemmShape<16, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename 
cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -579,9 +579,9 @@ static void BM_SM50_device_binary_or_binary_and_ssrgemm_tn_t_32x32x8_32x16x1_4x4 using WarpShape = cutlass::gemm::GemmShape<32, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -629,9 +629,9 @@ static void BM_SM50_device_binary_or_binary_and_ssrgemm_tn_t_32x64x8_32x32x1_8x4 using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -679,9 +679,9 @@ static void BM_SM50_device_binary_or_binary_and_ssrgemm_tn_t_32x128x8_32x64x1_8x using WarpShape = cutlass::gemm::GemmShape<32, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename 
cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -729,9 +729,9 @@ static void BM_SM50_device_binary_or_binary_and_ssrgemm_tn_t_64x64x8_64x32x1_8x8 using WarpShape = cutlass::gemm::GemmShape<64, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -779,9 +779,9 @@ static void BM_SM50_device_binary_or_binary_and_ssrgemm_tn_t_32x32x8_16x32x1_4x4 using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -829,9 +829,9 @@ static void BM_SM50_device_binary_or_binary_and_ssrgemm_tn_t_64x32x8_32x32x1_8x4 using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename 
cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -879,9 +879,9 @@ static void BM_SM50_device_binary_or_binary_and_ssrgemm_tn_t_64x64x8_32x64x1_8x8 using WarpShape = cutlass::gemm::GemmShape<32, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -929,9 +929,9 @@ static void BM_SM50_device_binary_or_binary_and_ssrgemm_tn_t_128x32x8_64x32x1_8x using WarpShape = cutlass::gemm::GemmShape<64, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -979,9 +979,9 @@ static void BM_SM50_device_binary_or_binary_and_ssrgemm_tn_t_16x32x8_8x16x1_2x2_ using WarpShape = cutlass::gemm::GemmShape<8, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename 
cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1029,9 +1029,9 @@ static void BM_SM50_device_binary_or_binary_and_ssrgemm_tn_t_16x64x8_8x32x1_2x4_ using WarpShape = cutlass::gemm::GemmShape<8, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1079,9 +1079,9 @@ static void BM_SM50_device_binary_or_binary_and_ssrgemm_tn_t_32x32x8_16x16x1_4x2 using WarpShape = cutlass::gemm::GemmShape<16, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1129,9 +1129,9 @@ static void BM_SM50_device_binary_or_binary_and_ssrgemm_tn_t_32x64x8_16x32x1_4x4 using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename 
cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1179,9 +1179,9 @@ static void BM_SM50_device_binary_or_binary_and_ssrgemm_tn_t_32x128x8_16x64x1_4x using WarpShape = cutlass::gemm::GemmShape<16, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1229,9 +1229,9 @@ static void BM_SM50_device_binary_or_binary_and_ssrgemm_tn_t_64x32x8_32x16x1_4x4 using WarpShape = cutlass::gemm::GemmShape<32, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1279,9 +1279,9 @@ static void BM_SM50_device_binary_or_binary_and_ssrgemm_tn_t_64x64x8_32x32x1_8x4 using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename 
cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1329,9 +1329,9 @@ static void BM_SM50_device_binary_or_binary_and_ssrgemm_tn_t_64x128x8_32x64x1_8x using WarpShape = cutlass::gemm::GemmShape<32, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1379,9 +1379,9 @@ static void BM_SM50_device_binary_or_binary_and_ssrgemm_tn_t_128x32x8_64x16x1_8x using WarpShape = cutlass::gemm::GemmShape<64, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1429,9 +1429,9 @@ static void BM_SM50_device_binary_or_binary_and_ssrgemm_tn_t_128x64x8_64x32x1_8x using WarpShape = cutlass::gemm::GemmShape<64, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename 
cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1479,9 +1479,9 @@ static void BM_SM50_device_binary_or_binary_and_ssrgemm_tn_t_16x64x16_8x16x1_2x2 using WarpShape = cutlass::gemm::GemmShape<8, 16, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1529,9 +1529,9 @@ static void BM_SM50_device_binary_or_binary_and_ssrgemm_tn_t_16x128x16_8x32x1_2x using WarpShape = cutlass::gemm::GemmShape<8, 32, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1579,9 +1579,9 @@ static void BM_SM50_device_binary_or_binary_and_ssrgemm_tn_t_32x32x8_16x8x1_2x2_ using WarpShape = cutlass::gemm::GemmShape<16, 8, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename 
cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1629,9 +1629,9 @@ static void BM_SM50_device_binary_or_binary_and_ssrgemm_tn_t_32x64x8_16x16x1_4x2 using WarpShape = cutlass::gemm::GemmShape<16, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1679,9 +1679,9 @@ static void BM_SM50_device_binary_or_binary_and_ssrgemm_tn_t_32x128x8_16x32x1_4x using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1729,9 +1729,9 @@ static void BM_SM50_device_binary_or_binary_and_ssrgemm_tn_t_32x256x8_16x64x1_4x using WarpShape = cutlass::gemm::GemmShape<16, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename 
cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1779,9 +1779,9 @@ static void BM_SM50_device_binary_or_binary_and_ssrgemm_tn_t_64x64x8_32x16x1_4x4 using WarpShape = cutlass::gemm::GemmShape<32, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1829,9 +1829,9 @@ static void BM_SM50_device_binary_or_binary_and_ssrgemm_tn_t_64x128x8_32x32x1_8x using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1879,9 +1879,9 @@ static void BM_SM50_device_binary_or_binary_and_ssrgemm_tn_t_64x256x8_32x64x1_8x using WarpShape = cutlass::gemm::GemmShape<32, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename 
cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1929,9 +1929,9 @@ static void BM_SM50_device_binary_or_binary_and_ssrgemm_tn_t_128x128x8_64x32x1_8 using WarpShape = cutlass::gemm::GemmShape<64, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1979,9 +1979,9 @@ static void BM_SM50_device_binary_or_binary_and_ssrgemm_tn_t_32x32x8_8x16x1_2x2_ using WarpShape = cutlass::gemm::GemmShape<8, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -2029,9 +2029,9 @@ static void BM_SM50_device_binary_or_binary_and_ssrgemm_tn_t_64x32x8_16x16x1_4x2 using WarpShape = cutlass::gemm::GemmShape<16, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename 
cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -2079,9 +2079,9 @@ static void BM_SM50_device_binary_or_binary_and_ssrgemm_tn_t_64x64x8_16x32x1_4x4 using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -2129,9 +2129,9 @@ static void BM_SM50_device_binary_or_binary_and_ssrgemm_tn_t_128x32x8_32x16x1_4x using WarpShape = cutlass::gemm::GemmShape<32, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -2179,9 +2179,9 @@ static void BM_SM50_device_binary_or_binary_and_ssrgemm_tn_t_128x64x8_32x32x1_8x using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename 
cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -2229,9 +2229,9 @@ static void BM_SM50_device_binary_or_binary_and_ssrgemm_tn_t_128x128x8_32x64x1_8 using WarpShape = cutlass::gemm::GemmShape<32, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -2279,9 +2279,9 @@ static void BM_SM50_device_binary_or_binary_and_ssrgemm_tn_t_256x32x8_64x16x1_8x using WarpShape = cutlass::gemm::GemmShape<64, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -2329,9 +2329,9 @@ static void BM_SM50_device_binary_or_binary_and_ssrgemm_tn_t_256x64x8_64x32x1_8x using WarpShape = cutlass::gemm::GemmShape<64, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename 
cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -2379,9 +2379,9 @@ static void BM_SM50_device_binary_or_binary_and_ssrgemm_tn_t_32x64x16_8x16x1_2x2 using WarpShape = cutlass::gemm::GemmShape<8, 16, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -2429,9 +2429,9 @@ static void BM_SM50_device_binary_or_binary_and_ssrgemm_tn_t_32x128x16_8x32x1_2x using WarpShape = cutlass::gemm::GemmShape<8, 32, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -2479,9 +2479,9 @@ static void BM_SM50_device_binary_or_binary_and_ssrgemm_tn_t_64x32x16_16x8x1_2x2 using WarpShape = cutlass::gemm::GemmShape<16, 8, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename 
cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -2529,9 +2529,9 @@ static void BM_SM50_device_binary_or_binary_and_ssrgemm_tn_t_64x64x8_16x16x1_4x2 using WarpShape = cutlass::gemm::GemmShape<16, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -2579,9 +2579,9 @@ static void BM_SM50_device_binary_or_binary_and_ssrgemm_tn_t_64x128x8_16x32x1_4x using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -2629,9 +2629,9 @@ static void BM_SM50_device_binary_or_binary_and_ssrgemm_tn_t_64x256x8_16x64x1_4x using WarpShape = cutlass::gemm::GemmShape<16, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename 
cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -2679,9 +2679,9 @@ static void BM_SM50_device_binary_or_binary_and_ssrgemm_tn_t_128x32x16_32x8x1_4x using WarpShape = cutlass::gemm::GemmShape<32, 8, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -2729,9 +2729,9 @@ static void BM_SM50_device_binary_or_binary_and_ssrgemm_tn_t_128x64x8_32x16x1_4x using WarpShape = cutlass::gemm::GemmShape<32, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -2779,9 +2779,9 @@ static void BM_SM50_device_binary_or_binary_and_ssrgemm_tn_t_128x128x8_32x32x1_8 using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename 
cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -2829,9 +2829,9 @@ static void BM_SM50_device_binary_or_binary_and_ssrgemm_tn_t_256x64x8_64x16x1_8x using WarpShape = cutlass::gemm::GemmShape<64, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; diff --git a/bench/device/sm50_simt_binary_or_binary_and_ssrgemm_tt_n.cu b/bench/device/sm50_simt_binary_or_binary_and_ssrgemm_tt_n.cu index 48e8bcb..da056ea 100644 --- a/bench/device/sm50_simt_binary_or_binary_and_ssrgemm_tt_n.cu +++ b/bench/device/sm50_simt_binary_or_binary_and_ssrgemm_tt_n.cu @@ -29,9 +29,9 @@ static void BM_SM50_device_binary_or_binary_and_ssrgemm_tt_n_8x32x8_8x32x1_2x4_4 using WarpShape = cutlass::gemm::GemmShape<8, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -79,9 +79,9 @@ static void BM_SM50_device_binary_or_binary_and_ssrgemm_tt_n_16x32x8_16x32x1_4x4 using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using 
InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -129,9 +129,9 @@ static void BM_SM50_device_binary_or_binary_and_ssrgemm_tt_n_16x64x8_16x64x1_4x8 using WarpShape = cutlass::gemm::GemmShape<16, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -179,9 +179,9 @@ static void BM_SM50_device_binary_or_binary_and_ssrgemm_tt_n_32x32x8_32x32x1_8x4 using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -229,9 +229,9 @@ static void BM_SM50_device_binary_or_binary_and_ssrgemm_tt_n_32x64x8_32x64x1_8x8 using WarpShape = cutlass::gemm::GemmShape<32, 64, 8>; using InstructionShape = 
cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -279,9 +279,9 @@ static void BM_SM50_device_binary_or_binary_and_ssrgemm_tt_n_64x32x8_64x32x1_8x8 using WarpShape = cutlass::gemm::GemmShape<64, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -329,9 +329,9 @@ static void BM_SM50_device_binary_or_binary_and_ssrgemm_tt_n_8x32x8_8x16x1_2x2_4 using WarpShape = cutlass::gemm::GemmShape<8, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -379,9 +379,9 @@ static void BM_SM50_device_binary_or_binary_and_ssrgemm_tt_n_8x64x8_8x32x1_2x4_4 using WarpShape = cutlass::gemm::GemmShape<8, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 
1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -429,9 +429,9 @@ static void BM_SM50_device_binary_or_binary_and_ssrgemm_tt_n_16x32x8_16x16x1_4x2 using WarpShape = cutlass::gemm::GemmShape<16, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -479,9 +479,9 @@ static void BM_SM50_device_binary_or_binary_and_ssrgemm_tt_n_16x64x8_16x32x1_4x4 using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -529,9 +529,9 @@ static void BM_SM50_device_binary_or_binary_and_ssrgemm_tt_n_16x128x8_16x64x1_4x using WarpShape = cutlass::gemm::GemmShape<16, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = 
typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -579,9 +579,9 @@ static void BM_SM50_device_binary_or_binary_and_ssrgemm_tt_n_32x32x8_32x16x1_4x4 using WarpShape = cutlass::gemm::GemmShape<32, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -629,9 +629,9 @@ static void BM_SM50_device_binary_or_binary_and_ssrgemm_tt_n_32x64x8_32x32x1_8x4 using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -679,9 +679,9 @@ static void BM_SM50_device_binary_or_binary_and_ssrgemm_tt_n_32x128x8_32x64x1_8x using WarpShape = cutlass::gemm::GemmShape<32, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename 
cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -729,9 +729,9 @@ static void BM_SM50_device_binary_or_binary_and_ssrgemm_tt_n_64x64x8_64x32x1_8x8 using WarpShape = cutlass::gemm::GemmShape<64, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -779,9 +779,9 @@ static void BM_SM50_device_binary_or_binary_and_ssrgemm_tt_n_32x32x8_16x32x1_4x4 using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -829,9 +829,9 @@ static void BM_SM50_device_binary_or_binary_and_ssrgemm_tt_n_64x32x8_32x32x1_8x4 using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename 
cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -879,9 +879,9 @@ static void BM_SM50_device_binary_or_binary_and_ssrgemm_tt_n_64x64x8_32x64x1_8x8 using WarpShape = cutlass::gemm::GemmShape<32, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -929,9 +929,9 @@ static void BM_SM50_device_binary_or_binary_and_ssrgemm_tt_n_128x32x8_64x32x1_8x using WarpShape = cutlass::gemm::GemmShape<64, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -979,9 +979,9 @@ static void BM_SM50_device_binary_or_binary_and_ssrgemm_tt_n_16x32x8_8x16x1_2x2_ using WarpShape = cutlass::gemm::GemmShape<8, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename 
cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1029,9 +1029,9 @@ static void BM_SM50_device_binary_or_binary_and_ssrgemm_tt_n_16x64x8_8x32x1_2x4_ using WarpShape = cutlass::gemm::GemmShape<8, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1079,9 +1079,9 @@ static void BM_SM50_device_binary_or_binary_and_ssrgemm_tt_n_32x32x8_16x16x1_4x2 using WarpShape = cutlass::gemm::GemmShape<16, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1129,9 +1129,9 @@ static void BM_SM50_device_binary_or_binary_and_ssrgemm_tt_n_32x64x8_16x32x1_4x4 using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename 
cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1179,9 +1179,9 @@ static void BM_SM50_device_binary_or_binary_and_ssrgemm_tt_n_32x128x8_16x64x1_4x using WarpShape = cutlass::gemm::GemmShape<16, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1229,9 +1229,9 @@ static void BM_SM50_device_binary_or_binary_and_ssrgemm_tt_n_64x32x8_32x16x1_4x4 using WarpShape = cutlass::gemm::GemmShape<32, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1279,9 +1279,9 @@ static void BM_SM50_device_binary_or_binary_and_ssrgemm_tt_n_64x64x8_32x32x1_8x4 using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename 
cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1329,9 +1329,9 @@ static void BM_SM50_device_binary_or_binary_and_ssrgemm_tt_n_64x128x8_32x64x1_8x using WarpShape = cutlass::gemm::GemmShape<32, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1379,9 +1379,9 @@ static void BM_SM50_device_binary_or_binary_and_ssrgemm_tt_n_128x32x8_64x16x1_8x using WarpShape = cutlass::gemm::GemmShape<64, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1429,9 +1429,9 @@ static void BM_SM50_device_binary_or_binary_and_ssrgemm_tt_n_128x64x8_64x32x1_8x using WarpShape = cutlass::gemm::GemmShape<64, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename 
cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1479,9 +1479,9 @@ static void BM_SM50_device_binary_or_binary_and_ssrgemm_tt_n_16x64x16_8x16x1_2x2 using WarpShape = cutlass::gemm::GemmShape<8, 16, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1529,9 +1529,9 @@ static void BM_SM50_device_binary_or_binary_and_ssrgemm_tt_n_16x128x16_8x32x1_2x using WarpShape = cutlass::gemm::GemmShape<8, 32, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1579,9 +1579,9 @@ static void BM_SM50_device_binary_or_binary_and_ssrgemm_tt_n_32x32x8_16x8x1_2x2_ using WarpShape = cutlass::gemm::GemmShape<16, 8, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename 
cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1629,9 +1629,9 @@ static void BM_SM50_device_binary_or_binary_and_ssrgemm_tt_n_32x64x8_16x16x1_4x2 using WarpShape = cutlass::gemm::GemmShape<16, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1679,9 +1679,9 @@ static void BM_SM50_device_binary_or_binary_and_ssrgemm_tt_n_32x128x8_16x32x1_4x using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1729,9 +1729,9 @@ static void BM_SM50_device_binary_or_binary_and_ssrgemm_tt_n_32x256x8_16x64x1_4x using WarpShape = cutlass::gemm::GemmShape<16, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename 
cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1779,9 +1779,9 @@ static void BM_SM50_device_binary_or_binary_and_ssrgemm_tt_n_64x64x8_32x16x1_4x4 using WarpShape = cutlass::gemm::GemmShape<32, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1829,9 +1829,9 @@ static void BM_SM50_device_binary_or_binary_and_ssrgemm_tt_n_64x128x8_32x32x1_8x using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1879,9 +1879,9 @@ static void BM_SM50_device_binary_or_binary_and_ssrgemm_tt_n_64x256x8_32x64x1_8x using WarpShape = cutlass::gemm::GemmShape<32, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename 
cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1929,9 +1929,9 @@ static void BM_SM50_device_binary_or_binary_and_ssrgemm_tt_n_128x128x8_64x32x1_8 using WarpShape = cutlass::gemm::GemmShape<64, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1979,9 +1979,9 @@ static void BM_SM50_device_binary_or_binary_and_ssrgemm_tt_n_32x32x8_8x16x1_2x2_ using WarpShape = cutlass::gemm::GemmShape<8, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -2029,9 +2029,9 @@ static void BM_SM50_device_binary_or_binary_and_ssrgemm_tt_n_64x32x8_16x16x1_4x2 using WarpShape = cutlass::gemm::GemmShape<16, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename 
cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -2079,9 +2079,9 @@ static void BM_SM50_device_binary_or_binary_and_ssrgemm_tt_n_64x64x8_16x32x1_4x4 using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -2129,9 +2129,9 @@ static void BM_SM50_device_binary_or_binary_and_ssrgemm_tt_n_128x32x8_32x16x1_4x using WarpShape = cutlass::gemm::GemmShape<32, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -2179,9 +2179,9 @@ static void BM_SM50_device_binary_or_binary_and_ssrgemm_tt_n_128x64x8_32x32x1_8x using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename 
cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -2229,9 +2229,9 @@ static void BM_SM50_device_binary_or_binary_and_ssrgemm_tt_n_128x128x8_32x64x1_8 using WarpShape = cutlass::gemm::GemmShape<32, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -2279,9 +2279,9 @@ static void BM_SM50_device_binary_or_binary_and_ssrgemm_tt_n_256x32x8_64x16x1_8x using WarpShape = cutlass::gemm::GemmShape<64, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -2329,9 +2329,9 @@ static void BM_SM50_device_binary_or_binary_and_ssrgemm_tt_n_256x64x8_64x32x1_8x using WarpShape = cutlass::gemm::GemmShape<64, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename 
cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -2379,9 +2379,9 @@ static void BM_SM50_device_binary_or_binary_and_ssrgemm_tt_n_32x64x16_8x16x1_2x2 using WarpShape = cutlass::gemm::GemmShape<8, 16, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -2429,9 +2429,9 @@ static void BM_SM50_device_binary_or_binary_and_ssrgemm_tt_n_32x128x16_8x32x1_2x using WarpShape = cutlass::gemm::GemmShape<8, 32, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -2479,9 +2479,9 @@ static void BM_SM50_device_binary_or_binary_and_ssrgemm_tt_n_64x32x16_16x8x1_2x2 using WarpShape = cutlass::gemm::GemmShape<16, 8, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename 
cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -2529,9 +2529,9 @@ static void BM_SM50_device_binary_or_binary_and_ssrgemm_tt_n_64x64x8_16x16x1_4x2 using WarpShape = cutlass::gemm::GemmShape<16, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -2579,9 +2579,9 @@ static void BM_SM50_device_binary_or_binary_and_ssrgemm_tt_n_64x128x8_16x32x1_4x using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -2629,9 +2629,9 @@ static void BM_SM50_device_binary_or_binary_and_ssrgemm_tt_n_64x256x8_16x64x1_4x using WarpShape = cutlass::gemm::GemmShape<16, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename 
cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -2679,9 +2679,9 @@ static void BM_SM50_device_binary_or_binary_and_ssrgemm_tt_n_128x32x16_32x8x1_4x using WarpShape = cutlass::gemm::GemmShape<32, 8, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -2729,9 +2729,9 @@ static void BM_SM50_device_binary_or_binary_and_ssrgemm_tt_n_128x64x8_32x16x1_4x using WarpShape = cutlass::gemm::GemmShape<32, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -2779,9 +2779,9 @@ static void BM_SM50_device_binary_or_binary_and_ssrgemm_tt_n_128x128x8_32x32x1_8 using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename 
cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -2829,9 +2829,9 @@ static void BM_SM50_device_binary_or_binary_and_ssrgemm_tt_n_256x64x8_64x16x1_8x using WarpShape = cutlass::gemm::GemmShape<64, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; diff --git a/bench/device/sm50_simt_binary_or_binary_and_ssrgemm_tt_t.cu b/bench/device/sm50_simt_binary_or_binary_and_ssrgemm_tt_t.cu index b2ece1d..ee840a1 100644 --- a/bench/device/sm50_simt_binary_or_binary_and_ssrgemm_tt_t.cu +++ b/bench/device/sm50_simt_binary_or_binary_and_ssrgemm_tt_t.cu @@ -29,9 +29,9 @@ static void BM_SM50_device_binary_or_binary_and_ssrgemm_tt_t_8x32x8_8x32x1_2x4_4 using WarpShape = cutlass::gemm::GemmShape<8, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = 
Config::MultiplicationOp; @@ -79,9 +79,9 @@ static void BM_SM50_device_binary_or_binary_and_ssrgemm_tt_t_16x32x8_16x32x1_4x4 using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -129,9 +129,9 @@ static void BM_SM50_device_binary_or_binary_and_ssrgemm_tt_t_16x64x8_16x64x1_4x8 using WarpShape = cutlass::gemm::GemmShape<16, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -179,9 +179,9 @@ static void BM_SM50_device_binary_or_binary_and_ssrgemm_tt_t_32x32x8_32x32x1_8x4 using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ 
-229,9 +229,9 @@ static void BM_SM50_device_binary_or_binary_and_ssrgemm_tt_t_32x64x8_32x64x1_8x8 using WarpShape = cutlass::gemm::GemmShape<32, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -279,9 +279,9 @@ static void BM_SM50_device_binary_or_binary_and_ssrgemm_tt_t_64x32x8_64x32x1_8x8 using WarpShape = cutlass::gemm::GemmShape<64, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -329,9 +329,9 @@ static void BM_SM50_device_binary_or_binary_and_ssrgemm_tt_t_8x32x8_8x16x1_2x2_4 using WarpShape = cutlass::gemm::GemmShape<8, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -379,9 +379,9 @@ static void 
BM_SM50_device_binary_or_binary_and_ssrgemm_tt_t_8x64x8_8x32x1_2x4_4 using WarpShape = cutlass::gemm::GemmShape<8, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -429,9 +429,9 @@ static void BM_SM50_device_binary_or_binary_and_ssrgemm_tt_t_16x32x8_16x16x1_4x2 using WarpShape = cutlass::gemm::GemmShape<16, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -479,9 +479,9 @@ static void BM_SM50_device_binary_or_binary_and_ssrgemm_tt_t_16x64x8_16x32x1_4x4 using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -529,9 +529,9 @@ static void 
BM_SM50_device_binary_or_binary_and_ssrgemm_tt_t_16x128x8_16x64x1_4x using WarpShape = cutlass::gemm::GemmShape<16, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -579,9 +579,9 @@ static void BM_SM50_device_binary_or_binary_and_ssrgemm_tt_t_32x32x8_32x16x1_4x4 using WarpShape = cutlass::gemm::GemmShape<32, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -629,9 +629,9 @@ static void BM_SM50_device_binary_or_binary_and_ssrgemm_tt_t_32x64x8_32x32x1_8x4 using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -679,9 +679,9 @@ static void 
BM_SM50_device_binary_or_binary_and_ssrgemm_tt_t_32x128x8_32x64x1_8x using WarpShape = cutlass::gemm::GemmShape<32, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -729,9 +729,9 @@ static void BM_SM50_device_binary_or_binary_and_ssrgemm_tt_t_64x64x8_64x32x1_8x8 using WarpShape = cutlass::gemm::GemmShape<64, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -779,9 +779,9 @@ static void BM_SM50_device_binary_or_binary_and_ssrgemm_tt_t_32x32x8_16x32x1_4x4 using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -829,9 +829,9 @@ static void 
BM_SM50_device_binary_or_binary_and_ssrgemm_tt_t_64x32x8_32x32x1_8x4 using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -879,9 +879,9 @@ static void BM_SM50_device_binary_or_binary_and_ssrgemm_tt_t_64x64x8_32x64x1_8x8 using WarpShape = cutlass::gemm::GemmShape<32, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -929,9 +929,9 @@ static void BM_SM50_device_binary_or_binary_and_ssrgemm_tt_t_128x32x8_64x32x1_8x using WarpShape = cutlass::gemm::GemmShape<64, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -979,9 +979,9 @@ static void 
BM_SM50_device_binary_or_binary_and_ssrgemm_tt_t_16x32x8_8x16x1_2x2_ using WarpShape = cutlass::gemm::GemmShape<8, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1029,9 +1029,9 @@ static void BM_SM50_device_binary_or_binary_and_ssrgemm_tt_t_16x64x8_8x32x1_2x4_ using WarpShape = cutlass::gemm::GemmShape<8, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1079,9 +1079,9 @@ static void BM_SM50_device_binary_or_binary_and_ssrgemm_tt_t_32x32x8_16x16x1_4x2 using WarpShape = cutlass::gemm::GemmShape<16, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1129,9 +1129,9 @@ static void 
BM_SM50_device_binary_or_binary_and_ssrgemm_tt_t_32x64x8_16x32x1_4x4 using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1179,9 +1179,9 @@ static void BM_SM50_device_binary_or_binary_and_ssrgemm_tt_t_32x128x8_16x64x1_4x using WarpShape = cutlass::gemm::GemmShape<16, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1229,9 +1229,9 @@ static void BM_SM50_device_binary_or_binary_and_ssrgemm_tt_t_64x32x8_32x16x1_4x4 using WarpShape = cutlass::gemm::GemmShape<32, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1279,9 +1279,9 @@ static void 
BM_SM50_device_binary_or_binary_and_ssrgemm_tt_t_64x64x8_32x32x1_8x4 using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1329,9 +1329,9 @@ static void BM_SM50_device_binary_or_binary_and_ssrgemm_tt_t_64x128x8_32x64x1_8x using WarpShape = cutlass::gemm::GemmShape<32, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1379,9 +1379,9 @@ static void BM_SM50_device_binary_or_binary_and_ssrgemm_tt_t_128x32x8_64x16x1_8x using WarpShape = cutlass::gemm::GemmShape<64, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1429,9 +1429,9 @@ static void 
BM_SM50_device_binary_or_binary_and_ssrgemm_tt_t_128x64x8_64x32x1_8x using WarpShape = cutlass::gemm::GemmShape<64, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1479,9 +1479,9 @@ static void BM_SM50_device_binary_or_binary_and_ssrgemm_tt_t_16x64x16_8x16x1_2x2 using WarpShape = cutlass::gemm::GemmShape<8, 16, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1529,9 +1529,9 @@ static void BM_SM50_device_binary_or_binary_and_ssrgemm_tt_t_16x128x16_8x32x1_2x using WarpShape = cutlass::gemm::GemmShape<8, 32, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1579,9 +1579,9 @@ static void 
BM_SM50_device_binary_or_binary_and_ssrgemm_tt_t_32x32x8_16x8x1_2x2_ using WarpShape = cutlass::gemm::GemmShape<16, 8, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1629,9 +1629,9 @@ static void BM_SM50_device_binary_or_binary_and_ssrgemm_tt_t_32x64x8_16x16x1_4x2 using WarpShape = cutlass::gemm::GemmShape<16, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1679,9 +1679,9 @@ static void BM_SM50_device_binary_or_binary_and_ssrgemm_tt_t_32x128x8_16x32x1_4x using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1729,9 +1729,9 @@ static void 
BM_SM50_device_binary_or_binary_and_ssrgemm_tt_t_32x256x8_16x64x1_4x using WarpShape = cutlass::gemm::GemmShape<16, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1779,9 +1779,9 @@ static void BM_SM50_device_binary_or_binary_and_ssrgemm_tt_t_64x64x8_32x16x1_4x4 using WarpShape = cutlass::gemm::GemmShape<32, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1829,9 +1829,9 @@ static void BM_SM50_device_binary_or_binary_and_ssrgemm_tt_t_64x128x8_32x32x1_8x using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1879,9 +1879,9 @@ static void 
BM_SM50_device_binary_or_binary_and_ssrgemm_tt_t_64x256x8_32x64x1_8x using WarpShape = cutlass::gemm::GemmShape<32, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1929,9 +1929,9 @@ static void BM_SM50_device_binary_or_binary_and_ssrgemm_tt_t_128x128x8_64x32x1_8 using WarpShape = cutlass::gemm::GemmShape<64, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1979,9 +1979,9 @@ static void BM_SM50_device_binary_or_binary_and_ssrgemm_tt_t_32x32x8_8x16x1_2x2_ using WarpShape = cutlass::gemm::GemmShape<8, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -2029,9 +2029,9 @@ static void 
BM_SM50_device_binary_or_binary_and_ssrgemm_tt_t_64x32x8_16x16x1_4x2 using WarpShape = cutlass::gemm::GemmShape<16, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -2079,9 +2079,9 @@ static void BM_SM50_device_binary_or_binary_and_ssrgemm_tt_t_64x64x8_16x32x1_4x4 using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -2129,9 +2129,9 @@ static void BM_SM50_device_binary_or_binary_and_ssrgemm_tt_t_128x32x8_32x16x1_4x using WarpShape = cutlass::gemm::GemmShape<32, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -2179,9 +2179,9 @@ static void 
BM_SM50_device_binary_or_binary_and_ssrgemm_tt_t_128x64x8_32x32x1_8x using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -2229,9 +2229,9 @@ static void BM_SM50_device_binary_or_binary_and_ssrgemm_tt_t_128x128x8_32x64x1_8 using WarpShape = cutlass::gemm::GemmShape<32, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -2279,9 +2279,9 @@ static void BM_SM50_device_binary_or_binary_and_ssrgemm_tt_t_256x32x8_64x16x1_8x using WarpShape = cutlass::gemm::GemmShape<64, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -2329,9 +2329,9 @@ static void 
BM_SM50_device_binary_or_binary_and_ssrgemm_tt_t_256x64x8_64x32x1_8x using WarpShape = cutlass::gemm::GemmShape<64, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -2379,9 +2379,9 @@ static void BM_SM50_device_binary_or_binary_and_ssrgemm_tt_t_32x64x16_8x16x1_2x2 using WarpShape = cutlass::gemm::GemmShape<8, 16, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -2429,9 +2429,9 @@ static void BM_SM50_device_binary_or_binary_and_ssrgemm_tt_t_32x128x16_8x32x1_2x using WarpShape = cutlass::gemm::GemmShape<8, 32, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -2479,9 +2479,9 @@ static void 
BM_SM50_device_binary_or_binary_and_ssrgemm_tt_t_64x32x16_16x8x1_2x2 using WarpShape = cutlass::gemm::GemmShape<16, 8, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -2529,9 +2529,9 @@ static void BM_SM50_device_binary_or_binary_and_ssrgemm_tt_t_64x64x8_16x16x1_4x2 using WarpShape = cutlass::gemm::GemmShape<16, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -2579,9 +2579,9 @@ static void BM_SM50_device_binary_or_binary_and_ssrgemm_tt_t_64x128x8_16x32x1_4x using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -2629,9 +2629,9 @@ static void 
BM_SM50_device_binary_or_binary_and_ssrgemm_tt_t_64x256x8_16x64x1_4x using WarpShape = cutlass::gemm::GemmShape<16, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -2679,9 +2679,9 @@ static void BM_SM50_device_binary_or_binary_and_ssrgemm_tt_t_128x32x16_32x8x1_4x using WarpShape = cutlass::gemm::GemmShape<32, 8, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -2729,9 +2729,9 @@ static void BM_SM50_device_binary_or_binary_and_ssrgemm_tt_t_128x64x8_32x16x1_4x using WarpShape = cutlass::gemm::GemmShape<32, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -2779,9 +2779,9 @@ static void 
BM_SM50_device_binary_or_binary_and_ssrgemm_tt_t_128x128x8_32x32x1_8 using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -2829,9 +2829,9 @@ static void BM_SM50_device_binary_or_binary_and_ssrgemm_tt_t_256x64x8_64x16x1_8x using WarpShape = cutlass::gemm::GemmShape<64, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; diff --git a/bench/device/sm50_simt_maximum_minimum_dsrgemm_nn_n.cu b/bench/device/sm50_simt_maximum_minimum_dsrgemm_nn_n.cu index 578387d..5d75475 100644 --- a/bench/device/sm50_simt_maximum_minimum_dsrgemm_nn_n.cu +++ b/bench/device/sm50_simt_maximum_minimum_dsrgemm_nn_n.cu @@ -29,9 +29,9 @@ static void BM_SM50_device_maximum_minimum_dsrgemm_nn_n_8x32x8_8x32x1_2x4_4x8_1x using WarpShape = cutlass::gemm::GemmShape<8, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename 
cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -79,9 +79,9 @@ static void BM_SM50_device_maximum_minimum_dsrgemm_nn_n_16x32x8_16x32x1_4x4_4x8_ using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -129,9 +129,9 @@ static void BM_SM50_device_maximum_minimum_dsrgemm_nn_n_16x64x8_16x64x1_4x8_4x8_ using WarpShape = cutlass::gemm::GemmShape<16, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -179,9 +179,9 @@ static void BM_SM50_device_maximum_minimum_dsrgemm_nn_n_32x32x8_32x32x1_8x4_4x8_ using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + 
precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -229,9 +229,9 @@ static void BM_SM50_device_maximum_minimum_dsrgemm_nn_n_8x32x8_8x16x1_2x2_4x8_1x using WarpShape = cutlass::gemm::GemmShape<8, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -279,9 +279,9 @@ static void BM_SM50_device_maximum_minimum_dsrgemm_nn_n_8x64x8_8x32x1_2x4_4x8_1x using WarpShape = cutlass::gemm::GemmShape<8, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -329,9 +329,9 @@ static void BM_SM50_device_maximum_minimum_dsrgemm_nn_n_16x32x8_16x16x1_4x2_4x8_ using WarpShape = cutlass::gemm::GemmShape<16, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + 
cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -379,9 +379,9 @@ static void BM_SM50_device_maximum_minimum_dsrgemm_nn_n_16x64x8_16x32x1_4x4_4x8_ using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -429,9 +429,9 @@ static void BM_SM50_device_maximum_minimum_dsrgemm_nn_n_16x128x8_16x64x1_4x8_4x8 using WarpShape = cutlass::gemm::GemmShape<16, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -479,9 +479,9 @@ static void BM_SM50_device_maximum_minimum_dsrgemm_nn_n_32x32x8_32x16x1_4x4_8x4_ using WarpShape = cutlass::gemm::GemmShape<32, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using 
AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -529,9 +529,9 @@ static void BM_SM50_device_maximum_minimum_dsrgemm_nn_n_32x64x8_32x32x1_8x4_4x8_ using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -579,9 +579,9 @@ static void BM_SM50_device_maximum_minimum_dsrgemm_nn_n_32x32x8_16x32x1_4x4_4x8_ using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -629,9 +629,9 @@ static void BM_SM50_device_maximum_minimum_dsrgemm_nn_n_64x32x8_32x32x1_8x4_4x8_ using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = 
Config::MultiplicationOp; @@ -679,9 +679,9 @@ static void BM_SM50_device_maximum_minimum_dsrgemm_nn_n_16x32x8_8x16x1_2x2_4x8_2 using WarpShape = cutlass::gemm::GemmShape<8, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -729,9 +729,9 @@ static void BM_SM50_device_maximum_minimum_dsrgemm_nn_n_16x64x8_8x32x1_2x4_4x8_2 using WarpShape = cutlass::gemm::GemmShape<8, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -779,9 +779,9 @@ static void BM_SM50_device_maximum_minimum_dsrgemm_nn_n_32x32x8_16x16x1_4x2_4x8_ using WarpShape = cutlass::gemm::GemmShape<16, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -829,9 +829,9 @@ static void 
BM_SM50_device_maximum_minimum_dsrgemm_nn_n_32x64x8_16x32x1_4x4_4x8_ using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -879,9 +879,9 @@ static void BM_SM50_device_maximum_minimum_dsrgemm_nn_n_32x128x8_16x64x1_4x8_4x8 using WarpShape = cutlass::gemm::GemmShape<16, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -929,9 +929,9 @@ static void BM_SM50_device_maximum_minimum_dsrgemm_nn_n_64x32x8_32x16x1_4x4_8x4_ using WarpShape = cutlass::gemm::GemmShape<32, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -979,9 +979,9 @@ static void 
BM_SM50_device_maximum_minimum_dsrgemm_nn_n_64x64x8_32x32x1_8x4_4x8_ using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1029,9 +1029,9 @@ static void BM_SM50_device_maximum_minimum_dsrgemm_nn_n_128x32x8_64x16x1_8x4_8x4 using WarpShape = cutlass::gemm::GemmShape<64, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1079,9 +1079,9 @@ static void BM_SM50_device_maximum_minimum_dsrgemm_nn_n_16x64x16_8x16x1_2x2_4x8_ using WarpShape = cutlass::gemm::GemmShape<8, 16, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1129,9 +1129,9 @@ static void 
BM_SM50_device_maximum_minimum_dsrgemm_nn_n_16x128x16_8x32x1_2x4_4x8 using WarpShape = cutlass::gemm::GemmShape<8, 32, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1179,9 +1179,9 @@ static void BM_SM50_device_maximum_minimum_dsrgemm_nn_n_32x32x8_16x8x1_2x2_8x4_2 using WarpShape = cutlass::gemm::GemmShape<16, 8, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1229,9 +1229,9 @@ static void BM_SM50_device_maximum_minimum_dsrgemm_nn_n_32x64x8_16x16x1_4x2_4x8_ using WarpShape = cutlass::gemm::GemmShape<16, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1279,9 +1279,9 @@ static void 
BM_SM50_device_maximum_minimum_dsrgemm_nn_n_32x128x8_16x32x1_4x4_4x8 using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1329,9 +1329,9 @@ static void BM_SM50_device_maximum_minimum_dsrgemm_nn_n_64x64x8_32x16x1_4x4_8x4_ using WarpShape = cutlass::gemm::GemmShape<32, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1379,9 +1379,9 @@ static void BM_SM50_device_maximum_minimum_dsrgemm_nn_n_32x32x8_8x16x1_2x2_4x8_4 using WarpShape = cutlass::gemm::GemmShape<8, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1429,9 +1429,9 @@ static void 
BM_SM50_device_maximum_minimum_dsrgemm_nn_n_64x32x8_16x16x1_4x2_4x8_ using WarpShape = cutlass::gemm::GemmShape<16, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1479,9 +1479,9 @@ static void BM_SM50_device_maximum_minimum_dsrgemm_nn_n_64x64x8_16x32x1_4x4_4x8_ using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1529,9 +1529,9 @@ static void BM_SM50_device_maximum_minimum_dsrgemm_nn_n_128x32x8_32x16x1_4x4_8x4 using WarpShape = cutlass::gemm::GemmShape<32, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1579,9 +1579,9 @@ static void 
BM_SM50_device_maximum_minimum_dsrgemm_nn_n_32x64x16_8x16x1_2x2_4x8_ using WarpShape = cutlass::gemm::GemmShape<8, 16, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1629,9 +1629,9 @@ static void BM_SM50_device_maximum_minimum_dsrgemm_nn_n_32x128x16_8x32x1_2x4_4x8 using WarpShape = cutlass::gemm::GemmShape<8, 32, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1679,9 +1679,9 @@ static void BM_SM50_device_maximum_minimum_dsrgemm_nn_n_64x32x16_16x8x1_2x2_8x4_ using WarpShape = cutlass::gemm::GemmShape<16, 8, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1729,9 +1729,9 @@ static void 
BM_SM50_device_maximum_minimum_dsrgemm_nn_n_64x64x8_16x16x1_4x2_4x8_ using WarpShape = cutlass::gemm::GemmShape<16, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1779,9 +1779,9 @@ static void BM_SM50_device_maximum_minimum_dsrgemm_nn_n_128x32x16_32x8x1_4x2_8x4 using WarpShape = cutlass::gemm::GemmShape<32, 8, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; diff --git a/bench/device/sm50_simt_maximum_minimum_dsrgemm_nn_t.cu b/bench/device/sm50_simt_maximum_minimum_dsrgemm_nn_t.cu index f4ac483..bc1772f 100644 --- a/bench/device/sm50_simt_maximum_minimum_dsrgemm_nn_t.cu +++ b/bench/device/sm50_simt_maximum_minimum_dsrgemm_nn_t.cu @@ -29,9 +29,9 @@ static void BM_SM50_device_maximum_minimum_dsrgemm_nn_t_8x32x8_8x32x1_2x4_4x8_1x using WarpShape = cutlass::gemm::GemmShape<8, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename 
cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -79,9 +79,9 @@ static void BM_SM50_device_maximum_minimum_dsrgemm_nn_t_16x32x8_16x32x1_4x4_4x8_ using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -129,9 +129,9 @@ static void BM_SM50_device_maximum_minimum_dsrgemm_nn_t_16x64x8_16x64x1_4x8_4x8_ using WarpShape = cutlass::gemm::GemmShape<16, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -179,9 +179,9 @@ static void BM_SM50_device_maximum_minimum_dsrgemm_nn_t_32x32x8_32x32x1_8x4_4x8_ using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + 
precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -229,9 +229,9 @@ static void BM_SM50_device_maximum_minimum_dsrgemm_nn_t_8x32x8_8x16x1_2x2_4x8_1x using WarpShape = cutlass::gemm::GemmShape<8, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -279,9 +279,9 @@ static void BM_SM50_device_maximum_minimum_dsrgemm_nn_t_8x64x8_8x32x1_2x4_4x8_1x using WarpShape = cutlass::gemm::GemmShape<8, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -329,9 +329,9 @@ static void BM_SM50_device_maximum_minimum_dsrgemm_nn_t_16x32x8_16x16x1_4x2_4x8_ using WarpShape = cutlass::gemm::GemmShape<16, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + 
cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -379,9 +379,9 @@ static void BM_SM50_device_maximum_minimum_dsrgemm_nn_t_16x64x8_16x32x1_4x4_4x8_ using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -429,9 +429,9 @@ static void BM_SM50_device_maximum_minimum_dsrgemm_nn_t_16x128x8_16x64x1_4x8_4x8 using WarpShape = cutlass::gemm::GemmShape<16, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -479,9 +479,9 @@ static void BM_SM50_device_maximum_minimum_dsrgemm_nn_t_32x32x8_32x16x1_4x4_8x4_ using WarpShape = cutlass::gemm::GemmShape<32, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using 
AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -529,9 +529,9 @@ static void BM_SM50_device_maximum_minimum_dsrgemm_nn_t_32x64x8_32x32x1_8x4_4x8_ using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -579,9 +579,9 @@ static void BM_SM50_device_maximum_minimum_dsrgemm_nn_t_32x32x8_16x32x1_4x4_4x8_ using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -629,9 +629,9 @@ static void BM_SM50_device_maximum_minimum_dsrgemm_nn_t_64x32x8_32x32x1_8x4_4x8_ using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = 
Config::MultiplicationOp; @@ -679,9 +679,9 @@ static void BM_SM50_device_maximum_minimum_dsrgemm_nn_t_16x32x8_8x16x1_2x2_4x8_2 using WarpShape = cutlass::gemm::GemmShape<8, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -729,9 +729,9 @@ static void BM_SM50_device_maximum_minimum_dsrgemm_nn_t_16x64x8_8x32x1_2x4_4x8_2 using WarpShape = cutlass::gemm::GemmShape<8, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -779,9 +779,9 @@ static void BM_SM50_device_maximum_minimum_dsrgemm_nn_t_32x32x8_16x16x1_4x2_4x8_ using WarpShape = cutlass::gemm::GemmShape<16, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -829,9 +829,9 @@ static void 
BM_SM50_device_maximum_minimum_dsrgemm_nn_t_32x64x8_16x32x1_4x4_4x8_ using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -879,9 +879,9 @@ static void BM_SM50_device_maximum_minimum_dsrgemm_nn_t_32x128x8_16x64x1_4x8_4x8 using WarpShape = cutlass::gemm::GemmShape<16, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -929,9 +929,9 @@ static void BM_SM50_device_maximum_minimum_dsrgemm_nn_t_64x32x8_32x16x1_4x4_8x4_ using WarpShape = cutlass::gemm::GemmShape<32, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -979,9 +979,9 @@ static void 
BM_SM50_device_maximum_minimum_dsrgemm_nn_t_64x64x8_32x32x1_8x4_4x8_ using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1029,9 +1029,9 @@ static void BM_SM50_device_maximum_minimum_dsrgemm_nn_t_128x32x8_64x16x1_8x4_8x4 using WarpShape = cutlass::gemm::GemmShape<64, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1079,9 +1079,9 @@ static void BM_SM50_device_maximum_minimum_dsrgemm_nn_t_16x64x16_8x16x1_2x2_4x8_ using WarpShape = cutlass::gemm::GemmShape<8, 16, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1129,9 +1129,9 @@ static void 
BM_SM50_device_maximum_minimum_dsrgemm_nn_t_16x128x16_8x32x1_2x4_4x8 using WarpShape = cutlass::gemm::GemmShape<8, 32, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1179,9 +1179,9 @@ static void BM_SM50_device_maximum_minimum_dsrgemm_nn_t_32x32x8_16x8x1_2x2_8x4_2 using WarpShape = cutlass::gemm::GemmShape<16, 8, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1229,9 +1229,9 @@ static void BM_SM50_device_maximum_minimum_dsrgemm_nn_t_32x64x8_16x16x1_4x2_4x8_ using WarpShape = cutlass::gemm::GemmShape<16, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1279,9 +1279,9 @@ static void 
BM_SM50_device_maximum_minimum_dsrgemm_nn_t_32x128x8_16x32x1_4x4_4x8 using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1329,9 +1329,9 @@ static void BM_SM50_device_maximum_minimum_dsrgemm_nn_t_64x64x8_32x16x1_4x4_8x4_ using WarpShape = cutlass::gemm::GemmShape<32, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1379,9 +1379,9 @@ static void BM_SM50_device_maximum_minimum_dsrgemm_nn_t_32x32x8_8x16x1_2x2_4x8_4 using WarpShape = cutlass::gemm::GemmShape<8, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1429,9 +1429,9 @@ static void 
BM_SM50_device_maximum_minimum_dsrgemm_nn_t_64x32x8_16x16x1_4x2_4x8_ using WarpShape = cutlass::gemm::GemmShape<16, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1479,9 +1479,9 @@ static void BM_SM50_device_maximum_minimum_dsrgemm_nn_t_64x64x8_16x32x1_4x4_4x8_ using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1529,9 +1529,9 @@ static void BM_SM50_device_maximum_minimum_dsrgemm_nn_t_128x32x8_32x16x1_4x4_8x4 using WarpShape = cutlass::gemm::GemmShape<32, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1579,9 +1579,9 @@ static void 
BM_SM50_device_maximum_minimum_dsrgemm_nn_t_32x64x16_8x16x1_2x2_4x8_ using WarpShape = cutlass::gemm::GemmShape<8, 16, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1629,9 +1629,9 @@ static void BM_SM50_device_maximum_minimum_dsrgemm_nn_t_32x128x16_8x32x1_2x4_4x8 using WarpShape = cutlass::gemm::GemmShape<8, 32, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1679,9 +1679,9 @@ static void BM_SM50_device_maximum_minimum_dsrgemm_nn_t_64x32x16_16x8x1_2x2_8x4_ using WarpShape = cutlass::gemm::GemmShape<16, 8, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1729,9 +1729,9 @@ static void 
BM_SM50_device_maximum_minimum_dsrgemm_nn_t_64x64x8_16x16x1_4x2_4x8_ using WarpShape = cutlass::gemm::GemmShape<16, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1779,9 +1779,9 @@ static void BM_SM50_device_maximum_minimum_dsrgemm_nn_t_128x32x16_32x8x1_4x2_8x4 using WarpShape = cutlass::gemm::GemmShape<32, 8, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; diff --git a/bench/device/sm50_simt_maximum_minimum_dsrgemm_nt_n.cu b/bench/device/sm50_simt_maximum_minimum_dsrgemm_nt_n.cu index de5e233..73d15f6 100644 --- a/bench/device/sm50_simt_maximum_minimum_dsrgemm_nt_n.cu +++ b/bench/device/sm50_simt_maximum_minimum_dsrgemm_nt_n.cu @@ -29,9 +29,9 @@ static void BM_SM50_device_maximum_minimum_dsrgemm_nt_n_8x32x8_8x32x1_2x4_4x8_1x using WarpShape = cutlass::gemm::GemmShape<8, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename 
cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -79,9 +79,9 @@ static void BM_SM50_device_maximum_minimum_dsrgemm_nt_n_16x32x8_16x32x1_4x4_4x8_ using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -129,9 +129,9 @@ static void BM_SM50_device_maximum_minimum_dsrgemm_nt_n_16x64x8_16x64x1_4x8_4x8_ using WarpShape = cutlass::gemm::GemmShape<16, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -179,9 +179,9 @@ static void BM_SM50_device_maximum_minimum_dsrgemm_nt_n_32x32x8_32x32x1_8x4_4x8_ using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + 
precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -229,9 +229,9 @@ static void BM_SM50_device_maximum_minimum_dsrgemm_nt_n_8x32x8_8x16x1_2x2_4x8_1x using WarpShape = cutlass::gemm::GemmShape<8, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -279,9 +279,9 @@ static void BM_SM50_device_maximum_minimum_dsrgemm_nt_n_8x64x8_8x32x1_2x4_4x8_1x using WarpShape = cutlass::gemm::GemmShape<8, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -329,9 +329,9 @@ static void BM_SM50_device_maximum_minimum_dsrgemm_nt_n_16x32x8_16x16x1_4x2_4x8_ using WarpShape = cutlass::gemm::GemmShape<16, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + 
cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -379,9 +379,9 @@ static void BM_SM50_device_maximum_minimum_dsrgemm_nt_n_16x64x8_16x32x1_4x4_4x8_ using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -429,9 +429,9 @@ static void BM_SM50_device_maximum_minimum_dsrgemm_nt_n_16x128x8_16x64x1_4x8_4x8 using WarpShape = cutlass::gemm::GemmShape<16, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -479,9 +479,9 @@ static void BM_SM50_device_maximum_minimum_dsrgemm_nt_n_32x32x8_32x16x1_4x4_8x4_ using WarpShape = cutlass::gemm::GemmShape<32, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using 
AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -529,9 +529,9 @@ static void BM_SM50_device_maximum_minimum_dsrgemm_nt_n_32x64x8_32x32x1_8x4_4x8_ using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -579,9 +579,9 @@ static void BM_SM50_device_maximum_minimum_dsrgemm_nt_n_32x32x8_16x32x1_4x4_4x8_ using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -629,9 +629,9 @@ static void BM_SM50_device_maximum_minimum_dsrgemm_nt_n_64x32x8_32x32x1_8x4_4x8_ using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = 
Config::MultiplicationOp; @@ -679,9 +679,9 @@ static void BM_SM50_device_maximum_minimum_dsrgemm_nt_n_16x32x8_8x16x1_2x2_4x8_2 using WarpShape = cutlass::gemm::GemmShape<8, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -729,9 +729,9 @@ static void BM_SM50_device_maximum_minimum_dsrgemm_nt_n_16x64x8_8x32x1_2x4_4x8_2 using WarpShape = cutlass::gemm::GemmShape<8, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -779,9 +779,9 @@ static void BM_SM50_device_maximum_minimum_dsrgemm_nt_n_32x32x8_16x16x1_4x2_4x8_ using WarpShape = cutlass::gemm::GemmShape<16, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -829,9 +829,9 @@ static void 
BM_SM50_device_maximum_minimum_dsrgemm_nt_n_32x64x8_16x32x1_4x4_4x8_ using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -879,9 +879,9 @@ static void BM_SM50_device_maximum_minimum_dsrgemm_nt_n_32x128x8_16x64x1_4x8_4x8 using WarpShape = cutlass::gemm::GemmShape<16, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -929,9 +929,9 @@ static void BM_SM50_device_maximum_minimum_dsrgemm_nt_n_64x32x8_32x16x1_4x4_8x4_ using WarpShape = cutlass::gemm::GemmShape<32, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -979,9 +979,9 @@ static void 
BM_SM50_device_maximum_minimum_dsrgemm_nt_n_64x64x8_32x32x1_8x4_4x8_ using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1029,9 +1029,9 @@ static void BM_SM50_device_maximum_minimum_dsrgemm_nt_n_128x32x8_64x16x1_8x4_8x4 using WarpShape = cutlass::gemm::GemmShape<64, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1079,9 +1079,9 @@ static void BM_SM50_device_maximum_minimum_dsrgemm_nt_n_16x64x16_8x16x1_2x2_4x8_ using WarpShape = cutlass::gemm::GemmShape<8, 16, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1129,9 +1129,9 @@ static void 
BM_SM50_device_maximum_minimum_dsrgemm_nt_n_16x128x16_8x32x1_2x4_4x8 using WarpShape = cutlass::gemm::GemmShape<8, 32, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1179,9 +1179,9 @@ static void BM_SM50_device_maximum_minimum_dsrgemm_nt_n_32x32x8_16x8x1_2x2_8x4_2 using WarpShape = cutlass::gemm::GemmShape<16, 8, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1229,9 +1229,9 @@ static void BM_SM50_device_maximum_minimum_dsrgemm_nt_n_32x64x8_16x16x1_4x2_4x8_ using WarpShape = cutlass::gemm::GemmShape<16, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1279,9 +1279,9 @@ static void 
BM_SM50_device_maximum_minimum_dsrgemm_nt_n_32x128x8_16x32x1_4x4_4x8 using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1329,9 +1329,9 @@ static void BM_SM50_device_maximum_minimum_dsrgemm_nt_n_64x64x8_32x16x1_4x4_8x4_ using WarpShape = cutlass::gemm::GemmShape<32, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1379,9 +1379,9 @@ static void BM_SM50_device_maximum_minimum_dsrgemm_nt_n_32x32x8_8x16x1_2x2_4x8_4 using WarpShape = cutlass::gemm::GemmShape<8, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1429,9 +1429,9 @@ static void 
BM_SM50_device_maximum_minimum_dsrgemm_nt_n_64x32x8_16x16x1_4x2_4x8_ using WarpShape = cutlass::gemm::GemmShape<16, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1479,9 +1479,9 @@ static void BM_SM50_device_maximum_minimum_dsrgemm_nt_n_64x64x8_16x32x1_4x4_4x8_ using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1529,9 +1529,9 @@ static void BM_SM50_device_maximum_minimum_dsrgemm_nt_n_128x32x8_32x16x1_4x4_8x4 using WarpShape = cutlass::gemm::GemmShape<32, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1579,9 +1579,9 @@ static void 
BM_SM50_device_maximum_minimum_dsrgemm_nt_n_32x64x16_8x16x1_2x2_4x8_ using WarpShape = cutlass::gemm::GemmShape<8, 16, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1629,9 +1629,9 @@ static void BM_SM50_device_maximum_minimum_dsrgemm_nt_n_32x128x16_8x32x1_2x4_4x8 using WarpShape = cutlass::gemm::GemmShape<8, 32, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1679,9 +1679,9 @@ static void BM_SM50_device_maximum_minimum_dsrgemm_nt_n_64x32x16_16x8x1_2x2_8x4_ using WarpShape = cutlass::gemm::GemmShape<16, 8, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1729,9 +1729,9 @@ static void 
BM_SM50_device_maximum_minimum_dsrgemm_nt_n_64x64x8_16x16x1_4x2_4x8_ using WarpShape = cutlass::gemm::GemmShape<16, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1779,9 +1779,9 @@ static void BM_SM50_device_maximum_minimum_dsrgemm_nt_n_128x32x16_32x8x1_4x2_8x4 using WarpShape = cutlass::gemm::GemmShape<32, 8, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; diff --git a/bench/device/sm50_simt_maximum_minimum_dsrgemm_nt_t.cu b/bench/device/sm50_simt_maximum_minimum_dsrgemm_nt_t.cu index 945aee0..2c2cf7a 100644 --- a/bench/device/sm50_simt_maximum_minimum_dsrgemm_nt_t.cu +++ b/bench/device/sm50_simt_maximum_minimum_dsrgemm_nt_t.cu @@ -29,9 +29,9 @@ static void BM_SM50_device_maximum_minimum_dsrgemm_nt_t_8x32x8_8x32x1_2x4_4x8_1x using WarpShape = cutlass::gemm::GemmShape<8, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename 
cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -79,9 +79,9 @@ static void BM_SM50_device_maximum_minimum_dsrgemm_nt_t_16x32x8_16x32x1_4x4_4x8_ using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -129,9 +129,9 @@ static void BM_SM50_device_maximum_minimum_dsrgemm_nt_t_16x64x8_16x64x1_4x8_4x8_ using WarpShape = cutlass::gemm::GemmShape<16, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -179,9 +179,9 @@ static void BM_SM50_device_maximum_minimum_dsrgemm_nt_t_32x32x8_32x32x1_8x4_4x8_ using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + 
precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -229,9 +229,9 @@ static void BM_SM50_device_maximum_minimum_dsrgemm_nt_t_8x32x8_8x16x1_2x2_4x8_1x using WarpShape = cutlass::gemm::GemmShape<8, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -279,9 +279,9 @@ static void BM_SM50_device_maximum_minimum_dsrgemm_nt_t_8x64x8_8x32x1_2x4_4x8_1x using WarpShape = cutlass::gemm::GemmShape<8, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -329,9 +329,9 @@ static void BM_SM50_device_maximum_minimum_dsrgemm_nt_t_16x32x8_16x16x1_4x2_4x8_ using WarpShape = cutlass::gemm::GemmShape<16, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + 
cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -379,9 +379,9 @@ static void BM_SM50_device_maximum_minimum_dsrgemm_nt_t_16x64x8_16x32x1_4x4_4x8_ using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -429,9 +429,9 @@ static void BM_SM50_device_maximum_minimum_dsrgemm_nt_t_16x128x8_16x64x1_4x8_4x8 using WarpShape = cutlass::gemm::GemmShape<16, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -479,9 +479,9 @@ static void BM_SM50_device_maximum_minimum_dsrgemm_nt_t_32x32x8_32x16x1_4x4_8x4_ using WarpShape = cutlass::gemm::GemmShape<32, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using 
AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -529,9 +529,9 @@ static void BM_SM50_device_maximum_minimum_dsrgemm_nt_t_32x64x8_32x32x1_8x4_4x8_ using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -579,9 +579,9 @@ static void BM_SM50_device_maximum_minimum_dsrgemm_nt_t_32x32x8_16x32x1_4x4_4x8_ using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -629,9 +629,9 @@ static void BM_SM50_device_maximum_minimum_dsrgemm_nt_t_64x32x8_32x32x1_8x4_4x8_ using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = 
Config::MultiplicationOp; @@ -679,9 +679,9 @@ static void BM_SM50_device_maximum_minimum_dsrgemm_nt_t_16x32x8_8x16x1_2x2_4x8_2 using WarpShape = cutlass::gemm::GemmShape<8, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -729,9 +729,9 @@ static void BM_SM50_device_maximum_minimum_dsrgemm_nt_t_16x64x8_8x32x1_2x4_4x8_2 using WarpShape = cutlass::gemm::GemmShape<8, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -779,9 +779,9 @@ static void BM_SM50_device_maximum_minimum_dsrgemm_nt_t_32x32x8_16x16x1_4x2_4x8_ using WarpShape = cutlass::gemm::GemmShape<16, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -829,9 +829,9 @@ static void 
BM_SM50_device_maximum_minimum_dsrgemm_nt_t_32x64x8_16x32x1_4x4_4x8_ using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -879,9 +879,9 @@ static void BM_SM50_device_maximum_minimum_dsrgemm_nt_t_32x128x8_16x64x1_4x8_4x8 using WarpShape = cutlass::gemm::GemmShape<16, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -929,9 +929,9 @@ static void BM_SM50_device_maximum_minimum_dsrgemm_nt_t_64x32x8_32x16x1_4x4_8x4_ using WarpShape = cutlass::gemm::GemmShape<32, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -979,9 +979,9 @@ static void 
BM_SM50_device_maximum_minimum_dsrgemm_nt_t_64x64x8_32x32x1_8x4_4x8_ using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1029,9 +1029,9 @@ static void BM_SM50_device_maximum_minimum_dsrgemm_nt_t_128x32x8_64x16x1_8x4_8x4 using WarpShape = cutlass::gemm::GemmShape<64, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1079,9 +1079,9 @@ static void BM_SM50_device_maximum_minimum_dsrgemm_nt_t_16x64x16_8x16x1_2x2_4x8_ using WarpShape = cutlass::gemm::GemmShape<8, 16, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1129,9 +1129,9 @@ static void 
BM_SM50_device_maximum_minimum_dsrgemm_nt_t_16x128x16_8x32x1_2x4_4x8 using WarpShape = cutlass::gemm::GemmShape<8, 32, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1179,9 +1179,9 @@ static void BM_SM50_device_maximum_minimum_dsrgemm_nt_t_32x32x8_16x8x1_2x2_8x4_2 using WarpShape = cutlass::gemm::GemmShape<16, 8, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1229,9 +1229,9 @@ static void BM_SM50_device_maximum_minimum_dsrgemm_nt_t_32x64x8_16x16x1_4x2_4x8_ using WarpShape = cutlass::gemm::GemmShape<16, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1279,9 +1279,9 @@ static void 
BM_SM50_device_maximum_minimum_dsrgemm_nt_t_32x128x8_16x32x1_4x4_4x8 using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1329,9 +1329,9 @@ static void BM_SM50_device_maximum_minimum_dsrgemm_nt_t_64x64x8_32x16x1_4x4_8x4_ using WarpShape = cutlass::gemm::GemmShape<32, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1379,9 +1379,9 @@ static void BM_SM50_device_maximum_minimum_dsrgemm_nt_t_32x32x8_8x16x1_2x2_4x8_4 using WarpShape = cutlass::gemm::GemmShape<8, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1429,9 +1429,9 @@ static void 
BM_SM50_device_maximum_minimum_dsrgemm_nt_t_64x32x8_16x16x1_4x2_4x8_ using WarpShape = cutlass::gemm::GemmShape<16, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1479,9 +1479,9 @@ static void BM_SM50_device_maximum_minimum_dsrgemm_nt_t_64x64x8_16x32x1_4x4_4x8_ using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1529,9 +1529,9 @@ static void BM_SM50_device_maximum_minimum_dsrgemm_nt_t_128x32x8_32x16x1_4x4_8x4 using WarpShape = cutlass::gemm::GemmShape<32, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1579,9 +1579,9 @@ static void 
BM_SM50_device_maximum_minimum_dsrgemm_nt_t_32x64x16_8x16x1_2x2_4x8_ using WarpShape = cutlass::gemm::GemmShape<8, 16, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1629,9 +1629,9 @@ static void BM_SM50_device_maximum_minimum_dsrgemm_nt_t_32x128x16_8x32x1_2x4_4x8 using WarpShape = cutlass::gemm::GemmShape<8, 32, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1679,9 +1679,9 @@ static void BM_SM50_device_maximum_minimum_dsrgemm_nt_t_64x32x16_16x8x1_2x2_8x4_ using WarpShape = cutlass::gemm::GemmShape<16, 8, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1729,9 +1729,9 @@ static void 
BM_SM50_device_maximum_minimum_dsrgemm_nt_t_64x64x8_16x16x1_4x2_4x8_ using WarpShape = cutlass::gemm::GemmShape<16, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1779,9 +1779,9 @@ static void BM_SM50_device_maximum_minimum_dsrgemm_nt_t_128x32x16_32x8x1_4x2_8x4 using WarpShape = cutlass::gemm::GemmShape<32, 8, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; diff --git a/bench/device/sm50_simt_maximum_minimum_dsrgemm_tn_n.cu b/bench/device/sm50_simt_maximum_minimum_dsrgemm_tn_n.cu index 0087de9..fc7583a 100644 --- a/bench/device/sm50_simt_maximum_minimum_dsrgemm_tn_n.cu +++ b/bench/device/sm50_simt_maximum_minimum_dsrgemm_tn_n.cu @@ -29,9 +29,9 @@ static void BM_SM50_device_maximum_minimum_dsrgemm_tn_n_8x32x8_8x32x1_2x4_4x8_1x using WarpShape = cutlass::gemm::GemmShape<8, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename 
cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -79,9 +79,9 @@ static void BM_SM50_device_maximum_minimum_dsrgemm_tn_n_16x32x8_16x32x1_4x4_4x8_ using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -129,9 +129,9 @@ static void BM_SM50_device_maximum_minimum_dsrgemm_tn_n_16x64x8_16x64x1_4x8_4x8_ using WarpShape = cutlass::gemm::GemmShape<16, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -179,9 +179,9 @@ static void BM_SM50_device_maximum_minimum_dsrgemm_tn_n_32x32x8_32x32x1_8x4_4x8_ using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + 
precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -229,9 +229,9 @@ static void BM_SM50_device_maximum_minimum_dsrgemm_tn_n_8x32x8_8x16x1_2x2_4x8_1x using WarpShape = cutlass::gemm::GemmShape<8, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -279,9 +279,9 @@ static void BM_SM50_device_maximum_minimum_dsrgemm_tn_n_8x64x8_8x32x1_2x4_4x8_1x using WarpShape = cutlass::gemm::GemmShape<8, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -329,9 +329,9 @@ static void BM_SM50_device_maximum_minimum_dsrgemm_tn_n_16x32x8_16x16x1_4x2_4x8_ using WarpShape = cutlass::gemm::GemmShape<16, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + 
cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -379,9 +379,9 @@ static void BM_SM50_device_maximum_minimum_dsrgemm_tn_n_16x64x8_16x32x1_4x4_4x8_ using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -429,9 +429,9 @@ static void BM_SM50_device_maximum_minimum_dsrgemm_tn_n_16x128x8_16x64x1_4x8_4x8 using WarpShape = cutlass::gemm::GemmShape<16, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -479,9 +479,9 @@ static void BM_SM50_device_maximum_minimum_dsrgemm_tn_n_32x32x8_32x16x1_4x4_8x4_ using WarpShape = cutlass::gemm::GemmShape<32, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using 
AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -529,9 +529,9 @@ static void BM_SM50_device_maximum_minimum_dsrgemm_tn_n_32x64x8_32x32x1_8x4_4x8_ using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -579,9 +579,9 @@ static void BM_SM50_device_maximum_minimum_dsrgemm_tn_n_32x32x8_16x32x1_4x4_4x8_ using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -629,9 +629,9 @@ static void BM_SM50_device_maximum_minimum_dsrgemm_tn_n_64x32x8_32x32x1_8x4_4x8_ using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = 
Config::MultiplicationOp; @@ -679,9 +679,9 @@ static void BM_SM50_device_maximum_minimum_dsrgemm_tn_n_16x32x8_8x16x1_2x2_4x8_2 using WarpShape = cutlass::gemm::GemmShape<8, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -729,9 +729,9 @@ static void BM_SM50_device_maximum_minimum_dsrgemm_tn_n_16x64x8_8x32x1_2x4_4x8_2 using WarpShape = cutlass::gemm::GemmShape<8, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -779,9 +779,9 @@ static void BM_SM50_device_maximum_minimum_dsrgemm_tn_n_32x32x8_16x16x1_4x2_4x8_ using WarpShape = cutlass::gemm::GemmShape<16, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -829,9 +829,9 @@ static void 
BM_SM50_device_maximum_minimum_dsrgemm_tn_n_32x64x8_16x32x1_4x4_4x8_ using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -879,9 +879,9 @@ static void BM_SM50_device_maximum_minimum_dsrgemm_tn_n_32x128x8_16x64x1_4x8_4x8 using WarpShape = cutlass::gemm::GemmShape<16, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -929,9 +929,9 @@ static void BM_SM50_device_maximum_minimum_dsrgemm_tn_n_64x32x8_32x16x1_4x4_8x4_ using WarpShape = cutlass::gemm::GemmShape<32, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -979,9 +979,9 @@ static void 
BM_SM50_device_maximum_minimum_dsrgemm_tn_n_64x64x8_32x32x1_8x4_4x8_ using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1029,9 +1029,9 @@ static void BM_SM50_device_maximum_minimum_dsrgemm_tn_n_128x32x8_64x16x1_8x4_8x4 using WarpShape = cutlass::gemm::GemmShape<64, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1079,9 +1079,9 @@ static void BM_SM50_device_maximum_minimum_dsrgemm_tn_n_16x64x16_8x16x1_2x2_4x8_ using WarpShape = cutlass::gemm::GemmShape<8, 16, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1129,9 +1129,9 @@ static void 
BM_SM50_device_maximum_minimum_dsrgemm_tn_n_16x128x16_8x32x1_2x4_4x8 using WarpShape = cutlass::gemm::GemmShape<8, 32, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1179,9 +1179,9 @@ static void BM_SM50_device_maximum_minimum_dsrgemm_tn_n_32x32x8_16x8x1_2x2_8x4_2 using WarpShape = cutlass::gemm::GemmShape<16, 8, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1229,9 +1229,9 @@ static void BM_SM50_device_maximum_minimum_dsrgemm_tn_n_32x64x8_16x16x1_4x2_4x8_ using WarpShape = cutlass::gemm::GemmShape<16, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1279,9 +1279,9 @@ static void 
BM_SM50_device_maximum_minimum_dsrgemm_tn_n_32x128x8_16x32x1_4x4_4x8 using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1329,9 +1329,9 @@ static void BM_SM50_device_maximum_minimum_dsrgemm_tn_n_64x64x8_32x16x1_4x4_8x4_ using WarpShape = cutlass::gemm::GemmShape<32, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1379,9 +1379,9 @@ static void BM_SM50_device_maximum_minimum_dsrgemm_tn_n_32x32x8_8x16x1_2x2_4x8_4 using WarpShape = cutlass::gemm::GemmShape<8, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1429,9 +1429,9 @@ static void 
BM_SM50_device_maximum_minimum_dsrgemm_tn_n_64x32x8_16x16x1_4x2_4x8_ using WarpShape = cutlass::gemm::GemmShape<16, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1479,9 +1479,9 @@ static void BM_SM50_device_maximum_minimum_dsrgemm_tn_n_64x64x8_16x32x1_4x4_4x8_ using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1529,9 +1529,9 @@ static void BM_SM50_device_maximum_minimum_dsrgemm_tn_n_128x32x8_32x16x1_4x4_8x4 using WarpShape = cutlass::gemm::GemmShape<32, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1579,9 +1579,9 @@ static void 
BM_SM50_device_maximum_minimum_dsrgemm_tn_n_32x64x16_8x16x1_2x2_4x8_ using WarpShape = cutlass::gemm::GemmShape<8, 16, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1629,9 +1629,9 @@ static void BM_SM50_device_maximum_minimum_dsrgemm_tn_n_32x128x16_8x32x1_2x4_4x8 using WarpShape = cutlass::gemm::GemmShape<8, 32, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1679,9 +1679,9 @@ static void BM_SM50_device_maximum_minimum_dsrgemm_tn_n_64x32x16_16x8x1_2x2_8x4_ using WarpShape = cutlass::gemm::GemmShape<16, 8, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1729,9 +1729,9 @@ static void 
BM_SM50_device_maximum_minimum_dsrgemm_tn_n_64x64x8_16x16x1_4x2_4x8_ using WarpShape = cutlass::gemm::GemmShape<16, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1779,9 +1779,9 @@ static void BM_SM50_device_maximum_minimum_dsrgemm_tn_n_128x32x16_32x8x1_4x2_8x4 using WarpShape = cutlass::gemm::GemmShape<32, 8, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; diff --git a/bench/device/sm50_simt_maximum_minimum_dsrgemm_tn_t.cu b/bench/device/sm50_simt_maximum_minimum_dsrgemm_tn_t.cu index 9f35d41..d02d958 100644 --- a/bench/device/sm50_simt_maximum_minimum_dsrgemm_tn_t.cu +++ b/bench/device/sm50_simt_maximum_minimum_dsrgemm_tn_t.cu @@ -29,9 +29,9 @@ static void BM_SM50_device_maximum_minimum_dsrgemm_tn_t_8x32x8_8x32x1_2x4_4x8_1x using WarpShape = cutlass::gemm::GemmShape<8, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename 
cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -79,9 +79,9 @@ static void BM_SM50_device_maximum_minimum_dsrgemm_tn_t_16x32x8_16x32x1_4x4_4x8_ using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -129,9 +129,9 @@ static void BM_SM50_device_maximum_minimum_dsrgemm_tn_t_16x64x8_16x64x1_4x8_4x8_ using WarpShape = cutlass::gemm::GemmShape<16, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -179,9 +179,9 @@ static void BM_SM50_device_maximum_minimum_dsrgemm_tn_t_32x32x8_32x32x1_8x4_4x8_ using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + 
precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -229,9 +229,9 @@ static void BM_SM50_device_maximum_minimum_dsrgemm_tn_t_8x32x8_8x16x1_2x2_4x8_1x using WarpShape = cutlass::gemm::GemmShape<8, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -279,9 +279,9 @@ static void BM_SM50_device_maximum_minimum_dsrgemm_tn_t_8x64x8_8x32x1_2x4_4x8_1x using WarpShape = cutlass::gemm::GemmShape<8, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -329,9 +329,9 @@ static void BM_SM50_device_maximum_minimum_dsrgemm_tn_t_16x32x8_16x16x1_4x2_4x8_ using WarpShape = cutlass::gemm::GemmShape<16, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + 
cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -379,9 +379,9 @@ static void BM_SM50_device_maximum_minimum_dsrgemm_tn_t_16x64x8_16x32x1_4x4_4x8_ using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -429,9 +429,9 @@ static void BM_SM50_device_maximum_minimum_dsrgemm_tn_t_16x128x8_16x64x1_4x8_4x8 using WarpShape = cutlass::gemm::GemmShape<16, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -479,9 +479,9 @@ static void BM_SM50_device_maximum_minimum_dsrgemm_tn_t_32x32x8_32x16x1_4x4_8x4_ using WarpShape = cutlass::gemm::GemmShape<32, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using 
AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -529,9 +529,9 @@ static void BM_SM50_device_maximum_minimum_dsrgemm_tn_t_32x64x8_32x32x1_8x4_4x8_ using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -579,9 +579,9 @@ static void BM_SM50_device_maximum_minimum_dsrgemm_tn_t_32x32x8_16x32x1_4x4_4x8_ using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -629,9 +629,9 @@ static void BM_SM50_device_maximum_minimum_dsrgemm_tn_t_64x32x8_32x32x1_8x4_4x8_ using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = 
Config::MultiplicationOp; @@ -679,9 +679,9 @@ static void BM_SM50_device_maximum_minimum_dsrgemm_tn_t_16x32x8_8x16x1_2x2_4x8_2 using WarpShape = cutlass::gemm::GemmShape<8, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -729,9 +729,9 @@ static void BM_SM50_device_maximum_minimum_dsrgemm_tn_t_16x64x8_8x32x1_2x4_4x8_2 using WarpShape = cutlass::gemm::GemmShape<8, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -779,9 +779,9 @@ static void BM_SM50_device_maximum_minimum_dsrgemm_tn_t_32x32x8_16x16x1_4x2_4x8_ using WarpShape = cutlass::gemm::GemmShape<16, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -829,9 +829,9 @@ static void 
BM_SM50_device_maximum_minimum_dsrgemm_tn_t_32x64x8_16x32x1_4x4_4x8_ using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -879,9 +879,9 @@ static void BM_SM50_device_maximum_minimum_dsrgemm_tn_t_32x128x8_16x64x1_4x8_4x8 using WarpShape = cutlass::gemm::GemmShape<16, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -929,9 +929,9 @@ static void BM_SM50_device_maximum_minimum_dsrgemm_tn_t_64x32x8_32x16x1_4x4_8x4_ using WarpShape = cutlass::gemm::GemmShape<32, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -979,9 +979,9 @@ static void 
BM_SM50_device_maximum_minimum_dsrgemm_tn_t_64x64x8_32x32x1_8x4_4x8_ using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1029,9 +1029,9 @@ static void BM_SM50_device_maximum_minimum_dsrgemm_tn_t_128x32x8_64x16x1_8x4_8x4 using WarpShape = cutlass::gemm::GemmShape<64, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1079,9 +1079,9 @@ static void BM_SM50_device_maximum_minimum_dsrgemm_tn_t_16x64x16_8x16x1_2x2_4x8_ using WarpShape = cutlass::gemm::GemmShape<8, 16, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1129,9 +1129,9 @@ static void 
BM_SM50_device_maximum_minimum_dsrgemm_tn_t_16x128x16_8x32x1_2x4_4x8 using WarpShape = cutlass::gemm::GemmShape<8, 32, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1179,9 +1179,9 @@ static void BM_SM50_device_maximum_minimum_dsrgemm_tn_t_32x32x8_16x8x1_2x2_8x4_2 using WarpShape = cutlass::gemm::GemmShape<16, 8, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1229,9 +1229,9 @@ static void BM_SM50_device_maximum_minimum_dsrgemm_tn_t_32x64x8_16x16x1_4x2_4x8_ using WarpShape = cutlass::gemm::GemmShape<16, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1279,9 +1279,9 @@ static void 
BM_SM50_device_maximum_minimum_dsrgemm_tn_t_32x128x8_16x32x1_4x4_4x8 using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1329,9 +1329,9 @@ static void BM_SM50_device_maximum_minimum_dsrgemm_tn_t_64x64x8_32x16x1_4x4_8x4_ using WarpShape = cutlass::gemm::GemmShape<32, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1379,9 +1379,9 @@ static void BM_SM50_device_maximum_minimum_dsrgemm_tn_t_32x32x8_8x16x1_2x2_4x8_4 using WarpShape = cutlass::gemm::GemmShape<8, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1429,9 +1429,9 @@ static void 
BM_SM50_device_maximum_minimum_dsrgemm_tn_t_64x32x8_16x16x1_4x2_4x8_ using WarpShape = cutlass::gemm::GemmShape<16, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1479,9 +1479,9 @@ static void BM_SM50_device_maximum_minimum_dsrgemm_tn_t_64x64x8_16x32x1_4x4_4x8_ using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1529,9 +1529,9 @@ static void BM_SM50_device_maximum_minimum_dsrgemm_tn_t_128x32x8_32x16x1_4x4_8x4 using WarpShape = cutlass::gemm::GemmShape<32, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1579,9 +1579,9 @@ static void 
BM_SM50_device_maximum_minimum_dsrgemm_tn_t_32x64x16_8x16x1_2x2_4x8_ using WarpShape = cutlass::gemm::GemmShape<8, 16, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1629,9 +1629,9 @@ static void BM_SM50_device_maximum_minimum_dsrgemm_tn_t_32x128x16_8x32x1_2x4_4x8 using WarpShape = cutlass::gemm::GemmShape<8, 32, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1679,9 +1679,9 @@ static void BM_SM50_device_maximum_minimum_dsrgemm_tn_t_64x32x16_16x8x1_2x2_8x4_ using WarpShape = cutlass::gemm::GemmShape<16, 8, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1729,9 +1729,9 @@ static void 
BM_SM50_device_maximum_minimum_dsrgemm_tn_t_64x64x8_16x16x1_4x2_4x8_ using WarpShape = cutlass::gemm::GemmShape<16, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1779,9 +1779,9 @@ static void BM_SM50_device_maximum_minimum_dsrgemm_tn_t_128x32x16_32x8x1_4x2_8x4 using WarpShape = cutlass::gemm::GemmShape<32, 8, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; diff --git a/bench/device/sm50_simt_maximum_minimum_dsrgemm_tt_n.cu b/bench/device/sm50_simt_maximum_minimum_dsrgemm_tt_n.cu index ca868f6..d347da6 100644 --- a/bench/device/sm50_simt_maximum_minimum_dsrgemm_tt_n.cu +++ b/bench/device/sm50_simt_maximum_minimum_dsrgemm_tt_n.cu @@ -29,9 +29,9 @@ static void BM_SM50_device_maximum_minimum_dsrgemm_tt_n_8x32x8_8x32x1_2x4_4x8_1x using WarpShape = cutlass::gemm::GemmShape<8, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename 
cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -79,9 +79,9 @@ static void BM_SM50_device_maximum_minimum_dsrgemm_tt_n_16x32x8_16x32x1_4x4_4x8_ using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -129,9 +129,9 @@ static void BM_SM50_device_maximum_minimum_dsrgemm_tt_n_16x64x8_16x64x1_4x8_4x8_ using WarpShape = cutlass::gemm::GemmShape<16, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -179,9 +179,9 @@ static void BM_SM50_device_maximum_minimum_dsrgemm_tt_n_32x32x8_32x32x1_8x4_4x8_ using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + 
precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -229,9 +229,9 @@ static void BM_SM50_device_maximum_minimum_dsrgemm_tt_n_8x32x8_8x16x1_2x2_4x8_1x using WarpShape = cutlass::gemm::GemmShape<8, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -279,9 +279,9 @@ static void BM_SM50_device_maximum_minimum_dsrgemm_tt_n_8x64x8_8x32x1_2x4_4x8_1x using WarpShape = cutlass::gemm::GemmShape<8, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -329,9 +329,9 @@ static void BM_SM50_device_maximum_minimum_dsrgemm_tt_n_16x32x8_16x16x1_4x2_4x8_ using WarpShape = cutlass::gemm::GemmShape<16, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + 
cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -379,9 +379,9 @@ static void BM_SM50_device_maximum_minimum_dsrgemm_tt_n_16x64x8_16x32x1_4x4_4x8_ using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -429,9 +429,9 @@ static void BM_SM50_device_maximum_minimum_dsrgemm_tt_n_16x128x8_16x64x1_4x8_4x8 using WarpShape = cutlass::gemm::GemmShape<16, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -479,9 +479,9 @@ static void BM_SM50_device_maximum_minimum_dsrgemm_tt_n_32x32x8_32x16x1_4x4_8x4_ using WarpShape = cutlass::gemm::GemmShape<32, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using 
AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -529,9 +529,9 @@ static void BM_SM50_device_maximum_minimum_dsrgemm_tt_n_32x64x8_32x32x1_8x4_4x8_ using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -579,9 +579,9 @@ static void BM_SM50_device_maximum_minimum_dsrgemm_tt_n_32x32x8_16x32x1_4x4_4x8_ using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -629,9 +629,9 @@ static void BM_SM50_device_maximum_minimum_dsrgemm_tt_n_64x32x8_32x32x1_8x4_4x8_ using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = 
Config::MultiplicationOp; @@ -679,9 +679,9 @@ static void BM_SM50_device_maximum_minimum_dsrgemm_tt_n_16x32x8_8x16x1_2x2_4x8_2 using WarpShape = cutlass::gemm::GemmShape<8, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -729,9 +729,9 @@ static void BM_SM50_device_maximum_minimum_dsrgemm_tt_n_16x64x8_8x32x1_2x4_4x8_2 using WarpShape = cutlass::gemm::GemmShape<8, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -779,9 +779,9 @@ static void BM_SM50_device_maximum_minimum_dsrgemm_tt_n_32x32x8_16x16x1_4x2_4x8_ using WarpShape = cutlass::gemm::GemmShape<16, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -829,9 +829,9 @@ static void 
BM_SM50_device_maximum_minimum_dsrgemm_tt_n_32x64x8_16x32x1_4x4_4x8_ using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -879,9 +879,9 @@ static void BM_SM50_device_maximum_minimum_dsrgemm_tt_n_32x128x8_16x64x1_4x8_4x8 using WarpShape = cutlass::gemm::GemmShape<16, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -929,9 +929,9 @@ static void BM_SM50_device_maximum_minimum_dsrgemm_tt_n_64x32x8_32x16x1_4x4_8x4_ using WarpShape = cutlass::gemm::GemmShape<32, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -979,9 +979,9 @@ static void 
BM_SM50_device_maximum_minimum_dsrgemm_tt_n_64x64x8_32x32x1_8x4_4x8_ using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1029,9 +1029,9 @@ static void BM_SM50_device_maximum_minimum_dsrgemm_tt_n_128x32x8_64x16x1_8x4_8x4 using WarpShape = cutlass::gemm::GemmShape<64, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1079,9 +1079,9 @@ static void BM_SM50_device_maximum_minimum_dsrgemm_tt_n_16x64x16_8x16x1_2x2_4x8_ using WarpShape = cutlass::gemm::GemmShape<8, 16, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1129,9 +1129,9 @@ static void 
BM_SM50_device_maximum_minimum_dsrgemm_tt_n_16x128x16_8x32x1_2x4_4x8 using WarpShape = cutlass::gemm::GemmShape<8, 32, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1179,9 +1179,9 @@ static void BM_SM50_device_maximum_minimum_dsrgemm_tt_n_32x32x8_16x8x1_2x2_8x4_2 using WarpShape = cutlass::gemm::GemmShape<16, 8, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1229,9 +1229,9 @@ static void BM_SM50_device_maximum_minimum_dsrgemm_tt_n_32x64x8_16x16x1_4x2_4x8_ using WarpShape = cutlass::gemm::GemmShape<16, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1279,9 +1279,9 @@ static void 
BM_SM50_device_maximum_minimum_dsrgemm_tt_n_32x128x8_16x32x1_4x4_4x8 using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1329,9 +1329,9 @@ static void BM_SM50_device_maximum_minimum_dsrgemm_tt_n_64x64x8_32x16x1_4x4_8x4_ using WarpShape = cutlass::gemm::GemmShape<32, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1379,9 +1379,9 @@ static void BM_SM50_device_maximum_minimum_dsrgemm_tt_n_32x32x8_8x16x1_2x2_4x8_4 using WarpShape = cutlass::gemm::GemmShape<8, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1429,9 +1429,9 @@ static void 
BM_SM50_device_maximum_minimum_dsrgemm_tt_n_64x32x8_16x16x1_4x2_4x8_ using WarpShape = cutlass::gemm::GemmShape<16, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1479,9 +1479,9 @@ static void BM_SM50_device_maximum_minimum_dsrgemm_tt_n_64x64x8_16x32x1_4x4_4x8_ using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1529,9 +1529,9 @@ static void BM_SM50_device_maximum_minimum_dsrgemm_tt_n_128x32x8_32x16x1_4x4_8x4 using WarpShape = cutlass::gemm::GemmShape<32, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1579,9 +1579,9 @@ static void 
BM_SM50_device_maximum_minimum_dsrgemm_tt_n_32x64x16_8x16x1_2x2_4x8_ using WarpShape = cutlass::gemm::GemmShape<8, 16, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1629,9 +1629,9 @@ static void BM_SM50_device_maximum_minimum_dsrgemm_tt_n_32x128x16_8x32x1_2x4_4x8 using WarpShape = cutlass::gemm::GemmShape<8, 32, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1679,9 +1679,9 @@ static void BM_SM50_device_maximum_minimum_dsrgemm_tt_n_64x32x16_16x8x1_2x2_8x4_ using WarpShape = cutlass::gemm::GemmShape<16, 8, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1729,9 +1729,9 @@ static void 
BM_SM50_device_maximum_minimum_dsrgemm_tt_n_64x64x8_16x16x1_4x2_4x8_ using WarpShape = cutlass::gemm::GemmShape<16, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1779,9 +1779,9 @@ static void BM_SM50_device_maximum_minimum_dsrgemm_tt_n_128x32x16_32x8x1_4x2_8x4 using WarpShape = cutlass::gemm::GemmShape<32, 8, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; diff --git a/bench/device/sm50_simt_maximum_minimum_dsrgemm_tt_t.cu b/bench/device/sm50_simt_maximum_minimum_dsrgemm_tt_t.cu index 1a70c9d..2df5698 100644 --- a/bench/device/sm50_simt_maximum_minimum_dsrgemm_tt_t.cu +++ b/bench/device/sm50_simt_maximum_minimum_dsrgemm_tt_t.cu @@ -29,9 +29,9 @@ static void BM_SM50_device_maximum_minimum_dsrgemm_tt_t_8x32x8_8x32x1_2x4_4x8_1x using WarpShape = cutlass::gemm::GemmShape<8, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename 
cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -79,9 +79,9 @@ static void BM_SM50_device_maximum_minimum_dsrgemm_tt_t_16x32x8_16x32x1_4x4_4x8_ using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -129,9 +129,9 @@ static void BM_SM50_device_maximum_minimum_dsrgemm_tt_t_16x64x8_16x64x1_4x8_4x8_ using WarpShape = cutlass::gemm::GemmShape<16, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -179,9 +179,9 @@ static void BM_SM50_device_maximum_minimum_dsrgemm_tt_t_32x32x8_32x32x1_8x4_4x8_ using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + 
precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -229,9 +229,9 @@ static void BM_SM50_device_maximum_minimum_dsrgemm_tt_t_8x32x8_8x16x1_2x2_4x8_1x using WarpShape = cutlass::gemm::GemmShape<8, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -279,9 +279,9 @@ static void BM_SM50_device_maximum_minimum_dsrgemm_tt_t_8x64x8_8x32x1_2x4_4x8_1x using WarpShape = cutlass::gemm::GemmShape<8, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -329,9 +329,9 @@ static void BM_SM50_device_maximum_minimum_dsrgemm_tt_t_16x32x8_16x16x1_4x2_4x8_ using WarpShape = cutlass::gemm::GemmShape<16, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + 
cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -379,9 +379,9 @@ static void BM_SM50_device_maximum_minimum_dsrgemm_tt_t_16x64x8_16x32x1_4x4_4x8_ using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -429,9 +429,9 @@ static void BM_SM50_device_maximum_minimum_dsrgemm_tt_t_16x128x8_16x64x1_4x8_4x8 using WarpShape = cutlass::gemm::GemmShape<16, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -479,9 +479,9 @@ static void BM_SM50_device_maximum_minimum_dsrgemm_tt_t_32x32x8_32x16x1_4x4_8x4_ using WarpShape = cutlass::gemm::GemmShape<32, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using 
AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -529,9 +529,9 @@ static void BM_SM50_device_maximum_minimum_dsrgemm_tt_t_32x64x8_32x32x1_8x4_4x8_ using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -579,9 +579,9 @@ static void BM_SM50_device_maximum_minimum_dsrgemm_tt_t_32x32x8_16x32x1_4x4_4x8_ using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -629,9 +629,9 @@ static void BM_SM50_device_maximum_minimum_dsrgemm_tt_t_64x32x8_32x32x1_8x4_4x8_ using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = 
Config::MultiplicationOp; @@ -679,9 +679,9 @@ static void BM_SM50_device_maximum_minimum_dsrgemm_tt_t_16x32x8_8x16x1_2x2_4x8_2 using WarpShape = cutlass::gemm::GemmShape<8, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -729,9 +729,9 @@ static void BM_SM50_device_maximum_minimum_dsrgemm_tt_t_16x64x8_8x32x1_2x4_4x8_2 using WarpShape = cutlass::gemm::GemmShape<8, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -779,9 +779,9 @@ static void BM_SM50_device_maximum_minimum_dsrgemm_tt_t_32x32x8_16x16x1_4x2_4x8_ using WarpShape = cutlass::gemm::GemmShape<16, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -829,9 +829,9 @@ static void 
BM_SM50_device_maximum_minimum_dsrgemm_tt_t_32x64x8_16x32x1_4x4_4x8_ using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -879,9 +879,9 @@ static void BM_SM50_device_maximum_minimum_dsrgemm_tt_t_32x128x8_16x64x1_4x8_4x8 using WarpShape = cutlass::gemm::GemmShape<16, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -929,9 +929,9 @@ static void BM_SM50_device_maximum_minimum_dsrgemm_tt_t_64x32x8_32x16x1_4x4_8x4_ using WarpShape = cutlass::gemm::GemmShape<32, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -979,9 +979,9 @@ static void 
BM_SM50_device_maximum_minimum_dsrgemm_tt_t_64x64x8_32x32x1_8x4_4x8_ using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1029,9 +1029,9 @@ static void BM_SM50_device_maximum_minimum_dsrgemm_tt_t_128x32x8_64x16x1_8x4_8x4 using WarpShape = cutlass::gemm::GemmShape<64, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1079,9 +1079,9 @@ static void BM_SM50_device_maximum_minimum_dsrgemm_tt_t_16x64x16_8x16x1_2x2_4x8_ using WarpShape = cutlass::gemm::GemmShape<8, 16, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1129,9 +1129,9 @@ static void 
BM_SM50_device_maximum_minimum_dsrgemm_tt_t_16x128x16_8x32x1_2x4_4x8 using WarpShape = cutlass::gemm::GemmShape<8, 32, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1179,9 +1179,9 @@ static void BM_SM50_device_maximum_minimum_dsrgemm_tt_t_32x32x8_16x8x1_2x2_8x4_2 using WarpShape = cutlass::gemm::GemmShape<16, 8, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1229,9 +1229,9 @@ static void BM_SM50_device_maximum_minimum_dsrgemm_tt_t_32x64x8_16x16x1_4x2_4x8_ using WarpShape = cutlass::gemm::GemmShape<16, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1279,9 +1279,9 @@ static void 
BM_SM50_device_maximum_minimum_dsrgemm_tt_t_32x128x8_16x32x1_4x4_4x8 using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1329,9 +1329,9 @@ static void BM_SM50_device_maximum_minimum_dsrgemm_tt_t_64x64x8_32x16x1_4x4_8x4_ using WarpShape = cutlass::gemm::GemmShape<32, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1379,9 +1379,9 @@ static void BM_SM50_device_maximum_minimum_dsrgemm_tt_t_32x32x8_8x16x1_2x2_4x8_4 using WarpShape = cutlass::gemm::GemmShape<8, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1429,9 +1429,9 @@ static void 
BM_SM50_device_maximum_minimum_dsrgemm_tt_t_64x32x8_16x16x1_4x2_4x8_ using WarpShape = cutlass::gemm::GemmShape<16, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1479,9 +1479,9 @@ static void BM_SM50_device_maximum_minimum_dsrgemm_tt_t_64x64x8_16x32x1_4x4_4x8_ using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1529,9 +1529,9 @@ static void BM_SM50_device_maximum_minimum_dsrgemm_tt_t_128x32x8_32x16x1_4x4_8x4 using WarpShape = cutlass::gemm::GemmShape<32, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1579,9 +1579,9 @@ static void 
BM_SM50_device_maximum_minimum_dsrgemm_tt_t_32x64x16_8x16x1_2x2_4x8_ using WarpShape = cutlass::gemm::GemmShape<8, 16, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1629,9 +1629,9 @@ static void BM_SM50_device_maximum_minimum_dsrgemm_tt_t_32x128x16_8x32x1_2x4_4x8 using WarpShape = cutlass::gemm::GemmShape<8, 32, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1679,9 +1679,9 @@ static void BM_SM50_device_maximum_minimum_dsrgemm_tt_t_64x32x16_16x8x1_2x2_8x4_ using WarpShape = cutlass::gemm::GemmShape<16, 8, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1729,9 +1729,9 @@ static void 
BM_SM50_device_maximum_minimum_dsrgemm_tt_t_64x64x8_16x16x1_4x2_4x8_ using WarpShape = cutlass::gemm::GemmShape<16, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1779,9 +1779,9 @@ static void BM_SM50_device_maximum_minimum_dsrgemm_tt_t_128x32x16_32x8x1_4x2_8x4 using WarpShape = cutlass::gemm::GemmShape<32, 8, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; diff --git a/bench/device/sm50_simt_maximum_minimum_ssrgemm_nn_n.cu b/bench/device/sm50_simt_maximum_minimum_ssrgemm_nn_n.cu index 7812c2c..ee63676 100644 --- a/bench/device/sm50_simt_maximum_minimum_ssrgemm_nn_n.cu +++ b/bench/device/sm50_simt_maximum_minimum_ssrgemm_nn_n.cu @@ -29,9 +29,9 @@ static void BM_SM50_device_maximum_minimum_ssrgemm_nn_n_8x32x8_8x32x1_2x4_4x8_1x using WarpShape = cutlass::gemm::GemmShape<8, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename 
cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -79,9 +79,9 @@ static void BM_SM50_device_maximum_minimum_ssrgemm_nn_n_16x32x8_16x32x1_4x4_4x8_ using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -129,9 +129,9 @@ static void BM_SM50_device_maximum_minimum_ssrgemm_nn_n_16x64x8_16x64x1_4x8_4x8_ using WarpShape = cutlass::gemm::GemmShape<16, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -179,9 +179,9 @@ static void BM_SM50_device_maximum_minimum_ssrgemm_nn_n_32x32x8_32x32x1_8x4_4x8_ using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + 
precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -229,9 +229,9 @@ static void BM_SM50_device_maximum_minimum_ssrgemm_nn_n_32x64x8_32x64x1_8x8_4x8_ using WarpShape = cutlass::gemm::GemmShape<32, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -279,9 +279,9 @@ static void BM_SM50_device_maximum_minimum_ssrgemm_nn_n_64x32x8_64x32x1_8x8_8x4_ using WarpShape = cutlass::gemm::GemmShape<64, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -329,9 +329,9 @@ static void BM_SM50_device_maximum_minimum_ssrgemm_nn_n_8x32x8_8x16x1_2x2_4x8_1x using WarpShape = cutlass::gemm::GemmShape<8, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + 
cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -379,9 +379,9 @@ static void BM_SM50_device_maximum_minimum_ssrgemm_nn_n_8x64x8_8x32x1_2x4_4x8_1x using WarpShape = cutlass::gemm::GemmShape<8, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -429,9 +429,9 @@ static void BM_SM50_device_maximum_minimum_ssrgemm_nn_n_16x32x8_16x16x1_4x2_4x8_ using WarpShape = cutlass::gemm::GemmShape<16, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -479,9 +479,9 @@ static void BM_SM50_device_maximum_minimum_ssrgemm_nn_n_16x64x8_16x32x1_4x4_4x8_ using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using 
AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -529,9 +529,9 @@ static void BM_SM50_device_maximum_minimum_ssrgemm_nn_n_16x128x8_16x64x1_4x8_4x8 using WarpShape = cutlass::gemm::GemmShape<16, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -579,9 +579,9 @@ static void BM_SM50_device_maximum_minimum_ssrgemm_nn_n_32x32x8_32x16x1_4x4_8x4_ using WarpShape = cutlass::gemm::GemmShape<32, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -629,9 +629,9 @@ static void BM_SM50_device_maximum_minimum_ssrgemm_nn_n_32x64x8_32x32x1_8x4_4x8_ using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = 
Config::MultiplicationOp; @@ -679,9 +679,9 @@ static void BM_SM50_device_maximum_minimum_ssrgemm_nn_n_32x128x8_32x64x1_8x8_4x8 using WarpShape = cutlass::gemm::GemmShape<32, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -729,9 +729,9 @@ static void BM_SM50_device_maximum_minimum_ssrgemm_nn_n_64x64x8_64x32x1_8x8_8x4_ using WarpShape = cutlass::gemm::GemmShape<64, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -779,9 +779,9 @@ static void BM_SM50_device_maximum_minimum_ssrgemm_nn_n_32x32x8_16x32x1_4x4_4x8_ using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -829,9 +829,9 @@ static void 
BM_SM50_device_maximum_minimum_ssrgemm_nn_n_64x32x8_32x32x1_8x4_4x8_ using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -879,9 +879,9 @@ static void BM_SM50_device_maximum_minimum_ssrgemm_nn_n_64x64x8_32x64x1_8x8_4x8_ using WarpShape = cutlass::gemm::GemmShape<32, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -929,9 +929,9 @@ static void BM_SM50_device_maximum_minimum_ssrgemm_nn_n_128x32x8_64x32x1_8x8_8x4 using WarpShape = cutlass::gemm::GemmShape<64, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -979,9 +979,9 @@ static void 
BM_SM50_device_maximum_minimum_ssrgemm_nn_n_16x32x8_8x16x1_2x2_4x8_2 using WarpShape = cutlass::gemm::GemmShape<8, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1029,9 +1029,9 @@ static void BM_SM50_device_maximum_minimum_ssrgemm_nn_n_16x64x8_8x32x1_2x4_4x8_2 using WarpShape = cutlass::gemm::GemmShape<8, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1079,9 +1079,9 @@ static void BM_SM50_device_maximum_minimum_ssrgemm_nn_n_32x32x8_16x16x1_4x2_4x8_ using WarpShape = cutlass::gemm::GemmShape<16, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1129,9 +1129,9 @@ static void 
BM_SM50_device_maximum_minimum_ssrgemm_nn_n_32x64x8_16x32x1_4x4_4x8_ using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1179,9 +1179,9 @@ static void BM_SM50_device_maximum_minimum_ssrgemm_nn_n_32x128x8_16x64x1_4x8_4x8 using WarpShape = cutlass::gemm::GemmShape<16, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1229,9 +1229,9 @@ static void BM_SM50_device_maximum_minimum_ssrgemm_nn_n_64x32x8_32x16x1_4x4_8x4_ using WarpShape = cutlass::gemm::GemmShape<32, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1279,9 +1279,9 @@ static void 
BM_SM50_device_maximum_minimum_ssrgemm_nn_n_64x64x8_32x32x1_8x4_4x8_ using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1329,9 +1329,9 @@ static void BM_SM50_device_maximum_minimum_ssrgemm_nn_n_64x128x8_32x64x1_8x8_4x8 using WarpShape = cutlass::gemm::GemmShape<32, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1379,9 +1379,9 @@ static void BM_SM50_device_maximum_minimum_ssrgemm_nn_n_128x32x8_64x16x1_8x4_8x4 using WarpShape = cutlass::gemm::GemmShape<64, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1429,9 +1429,9 @@ static void 
BM_SM50_device_maximum_minimum_ssrgemm_nn_n_128x64x8_64x32x1_8x8_8x4 using WarpShape = cutlass::gemm::GemmShape<64, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1479,9 +1479,9 @@ static void BM_SM50_device_maximum_minimum_ssrgemm_nn_n_16x64x16_8x16x1_2x2_4x8_ using WarpShape = cutlass::gemm::GemmShape<8, 16, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1529,9 +1529,9 @@ static void BM_SM50_device_maximum_minimum_ssrgemm_nn_n_16x128x16_8x32x1_2x4_4x8 using WarpShape = cutlass::gemm::GemmShape<8, 32, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1579,9 +1579,9 @@ static void 
BM_SM50_device_maximum_minimum_ssrgemm_nn_n_32x32x8_16x8x1_2x2_8x4_2 using WarpShape = cutlass::gemm::GemmShape<16, 8, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1629,9 +1629,9 @@ static void BM_SM50_device_maximum_minimum_ssrgemm_nn_n_32x64x8_16x16x1_4x2_4x8_ using WarpShape = cutlass::gemm::GemmShape<16, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1679,9 +1679,9 @@ static void BM_SM50_device_maximum_minimum_ssrgemm_nn_n_32x128x8_16x32x1_4x4_4x8 using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1729,9 +1729,9 @@ static void 
BM_SM50_device_maximum_minimum_ssrgemm_nn_n_32x256x8_16x64x1_4x8_4x8 using WarpShape = cutlass::gemm::GemmShape<16, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1779,9 +1779,9 @@ static void BM_SM50_device_maximum_minimum_ssrgemm_nn_n_64x64x8_32x16x1_4x4_8x4_ using WarpShape = cutlass::gemm::GemmShape<32, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1829,9 +1829,9 @@ static void BM_SM50_device_maximum_minimum_ssrgemm_nn_n_64x128x8_32x32x1_8x4_4x8 using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1879,9 +1879,9 @@ static void 
BM_SM50_device_maximum_minimum_ssrgemm_nn_n_64x256x8_32x64x1_8x8_4x8 using WarpShape = cutlass::gemm::GemmShape<32, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1929,9 +1929,9 @@ static void BM_SM50_device_maximum_minimum_ssrgemm_nn_n_128x128x8_64x32x1_8x8_8x using WarpShape = cutlass::gemm::GemmShape<64, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1979,9 +1979,9 @@ static void BM_SM50_device_maximum_minimum_ssrgemm_nn_n_32x32x8_8x16x1_2x2_4x8_4 using WarpShape = cutlass::gemm::GemmShape<8, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -2029,9 +2029,9 @@ static void 
BM_SM50_device_maximum_minimum_ssrgemm_nn_n_64x32x8_16x16x1_4x2_4x8_ using WarpShape = cutlass::gemm::GemmShape<16, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -2079,9 +2079,9 @@ static void BM_SM50_device_maximum_minimum_ssrgemm_nn_n_64x64x8_16x32x1_4x4_4x8_ using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -2129,9 +2129,9 @@ static void BM_SM50_device_maximum_minimum_ssrgemm_nn_n_128x32x8_32x16x1_4x4_8x4 using WarpShape = cutlass::gemm::GemmShape<32, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -2179,9 +2179,9 @@ static void 
BM_SM50_device_maximum_minimum_ssrgemm_nn_n_128x64x8_32x32x1_8x4_4x8 using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -2229,9 +2229,9 @@ static void BM_SM50_device_maximum_minimum_ssrgemm_nn_n_128x128x8_32x64x1_8x8_4x using WarpShape = cutlass::gemm::GemmShape<32, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -2279,9 +2279,9 @@ static void BM_SM50_device_maximum_minimum_ssrgemm_nn_n_256x32x8_64x16x1_8x4_8x4 using WarpShape = cutlass::gemm::GemmShape<64, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -2329,9 +2329,9 @@ static void 
BM_SM50_device_maximum_minimum_ssrgemm_nn_n_256x64x8_64x32x1_8x8_8x4 using WarpShape = cutlass::gemm::GemmShape<64, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -2379,9 +2379,9 @@ static void BM_SM50_device_maximum_minimum_ssrgemm_nn_n_32x64x16_8x16x1_2x2_4x8_ using WarpShape = cutlass::gemm::GemmShape<8, 16, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -2429,9 +2429,9 @@ static void BM_SM50_device_maximum_minimum_ssrgemm_nn_n_32x128x16_8x32x1_2x4_4x8 using WarpShape = cutlass::gemm::GemmShape<8, 32, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -2479,9 +2479,9 @@ static void 
BM_SM50_device_maximum_minimum_ssrgemm_nn_n_64x32x16_16x8x1_2x2_8x4_ using WarpShape = cutlass::gemm::GemmShape<16, 8, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -2529,9 +2529,9 @@ static void BM_SM50_device_maximum_minimum_ssrgemm_nn_n_64x64x8_16x16x1_4x2_4x8_ using WarpShape = cutlass::gemm::GemmShape<16, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -2579,9 +2579,9 @@ static void BM_SM50_device_maximum_minimum_ssrgemm_nn_n_64x128x8_16x32x1_4x4_4x8 using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -2629,9 +2629,9 @@ static void 
BM_SM50_device_maximum_minimum_ssrgemm_nn_n_64x256x8_16x64x1_4x8_4x8 using WarpShape = cutlass::gemm::GemmShape<16, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -2679,9 +2679,9 @@ static void BM_SM50_device_maximum_minimum_ssrgemm_nn_n_128x32x16_32x8x1_4x2_8x4 using WarpShape = cutlass::gemm::GemmShape<32, 8, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -2729,9 +2729,9 @@ static void BM_SM50_device_maximum_minimum_ssrgemm_nn_n_128x64x8_32x16x1_4x4_8x4 using WarpShape = cutlass::gemm::GemmShape<32, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -2779,9 +2779,9 @@ static void 
BM_SM50_device_maximum_minimum_ssrgemm_nn_n_128x128x8_32x32x1_8x4_4x using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -2829,9 +2829,9 @@ static void BM_SM50_device_maximum_minimum_ssrgemm_nn_n_256x64x8_64x16x1_8x4_8x4 using WarpShape = cutlass::gemm::GemmShape<64, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; diff --git a/bench/device/sm50_simt_maximum_minimum_ssrgemm_nn_t.cu b/bench/device/sm50_simt_maximum_minimum_ssrgemm_nn_t.cu index c73ae69..c629ad9 100644 --- a/bench/device/sm50_simt_maximum_minimum_ssrgemm_nn_t.cu +++ b/bench/device/sm50_simt_maximum_minimum_ssrgemm_nn_t.cu @@ -29,9 +29,9 @@ static void BM_SM50_device_maximum_minimum_ssrgemm_nn_t_8x32x8_8x32x1_2x4_4x8_1x using WarpShape = cutlass::gemm::GemmShape<8, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename 
cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -79,9 +79,9 @@ static void BM_SM50_device_maximum_minimum_ssrgemm_nn_t_16x32x8_16x32x1_4x4_4x8_ using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -129,9 +129,9 @@ static void BM_SM50_device_maximum_minimum_ssrgemm_nn_t_16x64x8_16x64x1_4x8_4x8_ using WarpShape = cutlass::gemm::GemmShape<16, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -179,9 +179,9 @@ static void BM_SM50_device_maximum_minimum_ssrgemm_nn_t_32x32x8_32x32x1_8x4_4x8_ using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + 
precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -229,9 +229,9 @@ static void BM_SM50_device_maximum_minimum_ssrgemm_nn_t_32x64x8_32x64x1_8x8_4x8_ using WarpShape = cutlass::gemm::GemmShape<32, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -279,9 +279,9 @@ static void BM_SM50_device_maximum_minimum_ssrgemm_nn_t_64x32x8_64x32x1_8x8_8x4_ using WarpShape = cutlass::gemm::GemmShape<64, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -329,9 +329,9 @@ static void BM_SM50_device_maximum_minimum_ssrgemm_nn_t_8x32x8_8x16x1_2x2_4x8_1x using WarpShape = cutlass::gemm::GemmShape<8, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + 
cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -379,9 +379,9 @@ static void BM_SM50_device_maximum_minimum_ssrgemm_nn_t_8x64x8_8x32x1_2x4_4x8_1x using WarpShape = cutlass::gemm::GemmShape<8, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -429,9 +429,9 @@ static void BM_SM50_device_maximum_minimum_ssrgemm_nn_t_16x32x8_16x16x1_4x2_4x8_ using WarpShape = cutlass::gemm::GemmShape<16, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -479,9 +479,9 @@ static void BM_SM50_device_maximum_minimum_ssrgemm_nn_t_16x64x8_16x32x1_4x4_4x8_ using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using 
AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -529,9 +529,9 @@ static void BM_SM50_device_maximum_minimum_ssrgemm_nn_t_16x128x8_16x64x1_4x8_4x8 using WarpShape = cutlass::gemm::GemmShape<16, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -579,9 +579,9 @@ static void BM_SM50_device_maximum_minimum_ssrgemm_nn_t_32x32x8_32x16x1_4x4_8x4_ using WarpShape = cutlass::gemm::GemmShape<32, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -629,9 +629,9 @@ static void BM_SM50_device_maximum_minimum_ssrgemm_nn_t_32x64x8_32x32x1_8x4_4x8_ using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = 
Config::MultiplicationOp; @@ -679,9 +679,9 @@ static void BM_SM50_device_maximum_minimum_ssrgemm_nn_t_32x128x8_32x64x1_8x8_4x8 using WarpShape = cutlass::gemm::GemmShape<32, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -729,9 +729,9 @@ static void BM_SM50_device_maximum_minimum_ssrgemm_nn_t_64x64x8_64x32x1_8x8_8x4_ using WarpShape = cutlass::gemm::GemmShape<64, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -779,9 +779,9 @@ static void BM_SM50_device_maximum_minimum_ssrgemm_nn_t_32x32x8_16x32x1_4x4_4x8_ using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -829,9 +829,9 @@ static void 
BM_SM50_device_maximum_minimum_ssrgemm_nn_t_64x32x8_32x32x1_8x4_4x8_ using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -879,9 +879,9 @@ static void BM_SM50_device_maximum_minimum_ssrgemm_nn_t_64x64x8_32x64x1_8x8_4x8_ using WarpShape = cutlass::gemm::GemmShape<32, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -929,9 +929,9 @@ static void BM_SM50_device_maximum_minimum_ssrgemm_nn_t_128x32x8_64x32x1_8x8_8x4 using WarpShape = cutlass::gemm::GemmShape<64, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -979,9 +979,9 @@ static void 
BM_SM50_device_maximum_minimum_ssrgemm_nn_t_16x32x8_8x16x1_2x2_4x8_2 using WarpShape = cutlass::gemm::GemmShape<8, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1029,9 +1029,9 @@ static void BM_SM50_device_maximum_minimum_ssrgemm_nn_t_16x64x8_8x32x1_2x4_4x8_2 using WarpShape = cutlass::gemm::GemmShape<8, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1079,9 +1079,9 @@ static void BM_SM50_device_maximum_minimum_ssrgemm_nn_t_32x32x8_16x16x1_4x2_4x8_ using WarpShape = cutlass::gemm::GemmShape<16, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1129,9 +1129,9 @@ static void 
BM_SM50_device_maximum_minimum_ssrgemm_nn_t_32x64x8_16x32x1_4x4_4x8_ using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1179,9 +1179,9 @@ static void BM_SM50_device_maximum_minimum_ssrgemm_nn_t_32x128x8_16x64x1_4x8_4x8 using WarpShape = cutlass::gemm::GemmShape<16, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1229,9 +1229,9 @@ static void BM_SM50_device_maximum_minimum_ssrgemm_nn_t_64x32x8_32x16x1_4x4_8x4_ using WarpShape = cutlass::gemm::GemmShape<32, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1279,9 +1279,9 @@ static void 
BM_SM50_device_maximum_minimum_ssrgemm_nn_t_64x64x8_32x32x1_8x4_4x8_ using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1329,9 +1329,9 @@ static void BM_SM50_device_maximum_minimum_ssrgemm_nn_t_64x128x8_32x64x1_8x8_4x8 using WarpShape = cutlass::gemm::GemmShape<32, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1379,9 +1379,9 @@ static void BM_SM50_device_maximum_minimum_ssrgemm_nn_t_128x32x8_64x16x1_8x4_8x4 using WarpShape = cutlass::gemm::GemmShape<64, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1429,9 +1429,9 @@ static void 
BM_SM50_device_maximum_minimum_ssrgemm_nn_t_128x64x8_64x32x1_8x8_8x4 using WarpShape = cutlass::gemm::GemmShape<64, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1479,9 +1479,9 @@ static void BM_SM50_device_maximum_minimum_ssrgemm_nn_t_16x64x16_8x16x1_2x2_4x8_ using WarpShape = cutlass::gemm::GemmShape<8, 16, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1529,9 +1529,9 @@ static void BM_SM50_device_maximum_minimum_ssrgemm_nn_t_16x128x16_8x32x1_2x4_4x8 using WarpShape = cutlass::gemm::GemmShape<8, 32, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1579,9 +1579,9 @@ static void 
BM_SM50_device_maximum_minimum_ssrgemm_nn_t_32x32x8_16x8x1_2x2_8x4_2 using WarpShape = cutlass::gemm::GemmShape<16, 8, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1629,9 +1629,9 @@ static void BM_SM50_device_maximum_minimum_ssrgemm_nn_t_32x64x8_16x16x1_4x2_4x8_ using WarpShape = cutlass::gemm::GemmShape<16, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1679,9 +1679,9 @@ static void BM_SM50_device_maximum_minimum_ssrgemm_nn_t_32x128x8_16x32x1_4x4_4x8 using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1729,9 +1729,9 @@ static void 
BM_SM50_device_maximum_minimum_ssrgemm_nn_t_32x256x8_16x64x1_4x8_4x8 using WarpShape = cutlass::gemm::GemmShape<16, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1779,9 +1779,9 @@ static void BM_SM50_device_maximum_minimum_ssrgemm_nn_t_64x64x8_32x16x1_4x4_8x4_ using WarpShape = cutlass::gemm::GemmShape<32, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1829,9 +1829,9 @@ static void BM_SM50_device_maximum_minimum_ssrgemm_nn_t_64x128x8_32x32x1_8x4_4x8 using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1879,9 +1879,9 @@ static void 
BM_SM50_device_maximum_minimum_ssrgemm_nn_t_64x256x8_32x64x1_8x8_4x8 using WarpShape = cutlass::gemm::GemmShape<32, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1929,9 +1929,9 @@ static void BM_SM50_device_maximum_minimum_ssrgemm_nn_t_128x128x8_64x32x1_8x8_8x using WarpShape = cutlass::gemm::GemmShape<64, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1979,9 +1979,9 @@ static void BM_SM50_device_maximum_minimum_ssrgemm_nn_t_32x32x8_8x16x1_2x2_4x8_4 using WarpShape = cutlass::gemm::GemmShape<8, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -2029,9 +2029,9 @@ static void 
BM_SM50_device_maximum_minimum_ssrgemm_nn_t_64x32x8_16x16x1_4x2_4x8_ using WarpShape = cutlass::gemm::GemmShape<16, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -2079,9 +2079,9 @@ static void BM_SM50_device_maximum_minimum_ssrgemm_nn_t_64x64x8_16x32x1_4x4_4x8_ using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -2129,9 +2129,9 @@ static void BM_SM50_device_maximum_minimum_ssrgemm_nn_t_128x32x8_32x16x1_4x4_8x4 using WarpShape = cutlass::gemm::GemmShape<32, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -2179,9 +2179,9 @@ static void 
BM_SM50_device_maximum_minimum_ssrgemm_nn_t_128x64x8_32x32x1_8x4_4x8 using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -2229,9 +2229,9 @@ static void BM_SM50_device_maximum_minimum_ssrgemm_nn_t_128x128x8_32x64x1_8x8_4x using WarpShape = cutlass::gemm::GemmShape<32, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -2279,9 +2279,9 @@ static void BM_SM50_device_maximum_minimum_ssrgemm_nn_t_256x32x8_64x16x1_8x4_8x4 using WarpShape = cutlass::gemm::GemmShape<64, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -2329,9 +2329,9 @@ static void 
BM_SM50_device_maximum_minimum_ssrgemm_nn_t_256x64x8_64x32x1_8x8_8x4 using WarpShape = cutlass::gemm::GemmShape<64, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -2379,9 +2379,9 @@ static void BM_SM50_device_maximum_minimum_ssrgemm_nn_t_32x64x16_8x16x1_2x2_4x8_ using WarpShape = cutlass::gemm::GemmShape<8, 16, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -2429,9 +2429,9 @@ static void BM_SM50_device_maximum_minimum_ssrgemm_nn_t_32x128x16_8x32x1_2x4_4x8 using WarpShape = cutlass::gemm::GemmShape<8, 32, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -2479,9 +2479,9 @@ static void 
BM_SM50_device_maximum_minimum_ssrgemm_nn_t_64x32x16_16x8x1_2x2_8x4_ using WarpShape = cutlass::gemm::GemmShape<16, 8, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -2529,9 +2529,9 @@ static void BM_SM50_device_maximum_minimum_ssrgemm_nn_t_64x64x8_16x16x1_4x2_4x8_ using WarpShape = cutlass::gemm::GemmShape<16, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -2579,9 +2579,9 @@ static void BM_SM50_device_maximum_minimum_ssrgemm_nn_t_64x128x8_16x32x1_4x4_4x8 using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -2629,9 +2629,9 @@ static void 
BM_SM50_device_maximum_minimum_ssrgemm_nn_t_64x256x8_16x64x1_4x8_4x8 using WarpShape = cutlass::gemm::GemmShape<16, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -2679,9 +2679,9 @@ static void BM_SM50_device_maximum_minimum_ssrgemm_nn_t_128x32x16_32x8x1_4x2_8x4 using WarpShape = cutlass::gemm::GemmShape<32, 8, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -2729,9 +2729,9 @@ static void BM_SM50_device_maximum_minimum_ssrgemm_nn_t_128x64x8_32x16x1_4x4_8x4 using WarpShape = cutlass::gemm::GemmShape<32, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -2779,9 +2779,9 @@ static void 
BM_SM50_device_maximum_minimum_ssrgemm_nn_t_128x128x8_32x32x1_8x4_4x using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -2829,9 +2829,9 @@ static void BM_SM50_device_maximum_minimum_ssrgemm_nn_t_256x64x8_64x16x1_8x4_8x4 using WarpShape = cutlass::gemm::GemmShape<64, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; diff --git a/bench/device/sm50_simt_maximum_minimum_ssrgemm_nt_n.cu b/bench/device/sm50_simt_maximum_minimum_ssrgemm_nt_n.cu index 2807465..d7425b4 100644 --- a/bench/device/sm50_simt_maximum_minimum_ssrgemm_nt_n.cu +++ b/bench/device/sm50_simt_maximum_minimum_ssrgemm_nt_n.cu @@ -29,9 +29,9 @@ static void BM_SM50_device_maximum_minimum_ssrgemm_nt_n_8x32x8_8x32x1_2x4_4x8_1x using WarpShape = cutlass::gemm::GemmShape<8, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename 
cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -79,9 +79,9 @@ static void BM_SM50_device_maximum_minimum_ssrgemm_nt_n_16x32x8_16x32x1_4x4_4x8_ using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -129,9 +129,9 @@ static void BM_SM50_device_maximum_minimum_ssrgemm_nt_n_16x64x8_16x64x1_4x8_4x8_ using WarpShape = cutlass::gemm::GemmShape<16, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -179,9 +179,9 @@ static void BM_SM50_device_maximum_minimum_ssrgemm_nt_n_32x32x8_32x32x1_8x4_4x8_ using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + 
precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -229,9 +229,9 @@ static void BM_SM50_device_maximum_minimum_ssrgemm_nt_n_32x64x8_32x64x1_8x8_4x8_ using WarpShape = cutlass::gemm::GemmShape<32, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -279,9 +279,9 @@ static void BM_SM50_device_maximum_minimum_ssrgemm_nt_n_64x32x8_64x32x1_8x8_8x4_ using WarpShape = cutlass::gemm::GemmShape<64, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -329,9 +329,9 @@ static void BM_SM50_device_maximum_minimum_ssrgemm_nt_n_8x32x8_8x16x1_2x2_4x8_1x using WarpShape = cutlass::gemm::GemmShape<8, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + 
cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -379,9 +379,9 @@ static void BM_SM50_device_maximum_minimum_ssrgemm_nt_n_8x64x8_8x32x1_2x4_4x8_1x using WarpShape = cutlass::gemm::GemmShape<8, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -429,9 +429,9 @@ static void BM_SM50_device_maximum_minimum_ssrgemm_nt_n_16x32x8_16x16x1_4x2_4x8_ using WarpShape = cutlass::gemm::GemmShape<16, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -479,9 +479,9 @@ static void BM_SM50_device_maximum_minimum_ssrgemm_nt_n_16x64x8_16x32x1_4x4_4x8_ using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using 
AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -529,9 +529,9 @@ static void BM_SM50_device_maximum_minimum_ssrgemm_nt_n_16x128x8_16x64x1_4x8_4x8 using WarpShape = cutlass::gemm::GemmShape<16, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -579,9 +579,9 @@ static void BM_SM50_device_maximum_minimum_ssrgemm_nt_n_32x32x8_32x16x1_4x4_8x4_ using WarpShape = cutlass::gemm::GemmShape<32, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -629,9 +629,9 @@ static void BM_SM50_device_maximum_minimum_ssrgemm_nt_n_32x64x8_32x32x1_8x4_4x8_ using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = 
Config::MultiplicationOp; @@ -679,9 +679,9 @@ static void BM_SM50_device_maximum_minimum_ssrgemm_nt_n_32x128x8_32x64x1_8x8_4x8 using WarpShape = cutlass::gemm::GemmShape<32, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -729,9 +729,9 @@ static void BM_SM50_device_maximum_minimum_ssrgemm_nt_n_64x64x8_64x32x1_8x8_8x4_ using WarpShape = cutlass::gemm::GemmShape<64, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -779,9 +779,9 @@ static void BM_SM50_device_maximum_minimum_ssrgemm_nt_n_32x32x8_16x32x1_4x4_4x8_ using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -829,9 +829,9 @@ static void 
BM_SM50_device_maximum_minimum_ssrgemm_nt_n_64x32x8_32x32x1_8x4_4x8_ using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -879,9 +879,9 @@ static void BM_SM50_device_maximum_minimum_ssrgemm_nt_n_64x64x8_32x64x1_8x8_4x8_ using WarpShape = cutlass::gemm::GemmShape<32, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -929,9 +929,9 @@ static void BM_SM50_device_maximum_minimum_ssrgemm_nt_n_128x32x8_64x32x1_8x8_8x4 using WarpShape = cutlass::gemm::GemmShape<64, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -979,9 +979,9 @@ static void 
BM_SM50_device_maximum_minimum_ssrgemm_nt_n_16x32x8_8x16x1_2x2_4x8_2 using WarpShape = cutlass::gemm::GemmShape<8, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1029,9 +1029,9 @@ static void BM_SM50_device_maximum_minimum_ssrgemm_nt_n_16x64x8_8x32x1_2x4_4x8_2 using WarpShape = cutlass::gemm::GemmShape<8, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1079,9 +1079,9 @@ static void BM_SM50_device_maximum_minimum_ssrgemm_nt_n_32x32x8_16x16x1_4x2_4x8_ using WarpShape = cutlass::gemm::GemmShape<16, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1129,9 +1129,9 @@ static void 
BM_SM50_device_maximum_minimum_ssrgemm_nt_n_32x64x8_16x32x1_4x4_4x8_ using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1179,9 +1179,9 @@ static void BM_SM50_device_maximum_minimum_ssrgemm_nt_n_32x128x8_16x64x1_4x8_4x8 using WarpShape = cutlass::gemm::GemmShape<16, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1229,9 +1229,9 @@ static void BM_SM50_device_maximum_minimum_ssrgemm_nt_n_64x32x8_32x16x1_4x4_8x4_ using WarpShape = cutlass::gemm::GemmShape<32, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1279,9 +1279,9 @@ static void 
BM_SM50_device_maximum_minimum_ssrgemm_nt_n_64x64x8_32x32x1_8x4_4x8_ using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1329,9 +1329,9 @@ static void BM_SM50_device_maximum_minimum_ssrgemm_nt_n_64x128x8_32x64x1_8x8_4x8 using WarpShape = cutlass::gemm::GemmShape<32, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1379,9 +1379,9 @@ static void BM_SM50_device_maximum_minimum_ssrgemm_nt_n_128x32x8_64x16x1_8x4_8x4 using WarpShape = cutlass::gemm::GemmShape<64, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1429,9 +1429,9 @@ static void 
BM_SM50_device_maximum_minimum_ssrgemm_nt_n_128x64x8_64x32x1_8x8_8x4 using WarpShape = cutlass::gemm::GemmShape<64, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1479,9 +1479,9 @@ static void BM_SM50_device_maximum_minimum_ssrgemm_nt_n_16x64x16_8x16x1_2x2_4x8_ using WarpShape = cutlass::gemm::GemmShape<8, 16, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1529,9 +1529,9 @@ static void BM_SM50_device_maximum_minimum_ssrgemm_nt_n_16x128x16_8x32x1_2x4_4x8 using WarpShape = cutlass::gemm::GemmShape<8, 32, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1579,9 +1579,9 @@ static void 
BM_SM50_device_maximum_minimum_ssrgemm_nt_n_32x32x8_16x8x1_2x2_8x4_2 using WarpShape = cutlass::gemm::GemmShape<16, 8, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1629,9 +1629,9 @@ static void BM_SM50_device_maximum_minimum_ssrgemm_nt_n_32x64x8_16x16x1_4x2_4x8_ using WarpShape = cutlass::gemm::GemmShape<16, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1679,9 +1679,9 @@ static void BM_SM50_device_maximum_minimum_ssrgemm_nt_n_32x128x8_16x32x1_4x4_4x8 using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1729,9 +1729,9 @@ static void 
BM_SM50_device_maximum_minimum_ssrgemm_nt_n_32x256x8_16x64x1_4x8_4x8 using WarpShape = cutlass::gemm::GemmShape<16, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1779,9 +1779,9 @@ static void BM_SM50_device_maximum_minimum_ssrgemm_nt_n_64x64x8_32x16x1_4x4_8x4_ using WarpShape = cutlass::gemm::GemmShape<32, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1829,9 +1829,9 @@ static void BM_SM50_device_maximum_minimum_ssrgemm_nt_n_64x128x8_32x32x1_8x4_4x8 using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1879,9 +1879,9 @@ static void 
BM_SM50_device_maximum_minimum_ssrgemm_nt_n_64x256x8_32x64x1_8x8_4x8 using WarpShape = cutlass::gemm::GemmShape<32, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1929,9 +1929,9 @@ static void BM_SM50_device_maximum_minimum_ssrgemm_nt_n_128x128x8_64x32x1_8x8_8x using WarpShape = cutlass::gemm::GemmShape<64, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1979,9 +1979,9 @@ static void BM_SM50_device_maximum_minimum_ssrgemm_nt_n_32x32x8_8x16x1_2x2_4x8_4 using WarpShape = cutlass::gemm::GemmShape<8, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -2029,9 +2029,9 @@ static void 
BM_SM50_device_maximum_minimum_ssrgemm_nt_n_64x32x8_16x16x1_4x2_4x8_ using WarpShape = cutlass::gemm::GemmShape<16, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -2079,9 +2079,9 @@ static void BM_SM50_device_maximum_minimum_ssrgemm_nt_n_64x64x8_16x32x1_4x4_4x8_ using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -2129,9 +2129,9 @@ static void BM_SM50_device_maximum_minimum_ssrgemm_nt_n_128x32x8_32x16x1_4x4_8x4 using WarpShape = cutlass::gemm::GemmShape<32, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -2179,9 +2179,9 @@ static void 
BM_SM50_device_maximum_minimum_ssrgemm_nt_n_128x64x8_32x32x1_8x4_4x8 using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -2229,9 +2229,9 @@ static void BM_SM50_device_maximum_minimum_ssrgemm_nt_n_128x128x8_32x64x1_8x8_4x using WarpShape = cutlass::gemm::GemmShape<32, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -2279,9 +2279,9 @@ static void BM_SM50_device_maximum_minimum_ssrgemm_nt_n_256x32x8_64x16x1_8x4_8x4 using WarpShape = cutlass::gemm::GemmShape<64, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -2329,9 +2329,9 @@ static void 
BM_SM50_device_maximum_minimum_ssrgemm_nt_n_256x64x8_64x32x1_8x8_8x4 using WarpShape = cutlass::gemm::GemmShape<64, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -2379,9 +2379,9 @@ static void BM_SM50_device_maximum_minimum_ssrgemm_nt_n_32x64x16_8x16x1_2x2_4x8_ using WarpShape = cutlass::gemm::GemmShape<8, 16, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -2429,9 +2429,9 @@ static void BM_SM50_device_maximum_minimum_ssrgemm_nt_n_32x128x16_8x32x1_2x4_4x8 using WarpShape = cutlass::gemm::GemmShape<8, 32, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -2479,9 +2479,9 @@ static void 
BM_SM50_device_maximum_minimum_ssrgemm_nt_n_64x32x16_16x8x1_2x2_8x4_ using WarpShape = cutlass::gemm::GemmShape<16, 8, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -2529,9 +2529,9 @@ static void BM_SM50_device_maximum_minimum_ssrgemm_nt_n_64x64x8_16x16x1_4x2_4x8_ using WarpShape = cutlass::gemm::GemmShape<16, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -2579,9 +2579,9 @@ static void BM_SM50_device_maximum_minimum_ssrgemm_nt_n_64x128x8_16x32x1_4x4_4x8 using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -2629,9 +2629,9 @@ static void 
BM_SM50_device_maximum_minimum_ssrgemm_nt_n_64x256x8_16x64x1_4x8_4x8 using WarpShape = cutlass::gemm::GemmShape<16, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -2679,9 +2679,9 @@ static void BM_SM50_device_maximum_minimum_ssrgemm_nt_n_128x32x16_32x8x1_4x2_8x4 using WarpShape = cutlass::gemm::GemmShape<32, 8, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -2729,9 +2729,9 @@ static void BM_SM50_device_maximum_minimum_ssrgemm_nt_n_128x64x8_32x16x1_4x4_8x4 using WarpShape = cutlass::gemm::GemmShape<32, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -2779,9 +2779,9 @@ static void 
BM_SM50_device_maximum_minimum_ssrgemm_nt_n_128x128x8_32x32x1_8x4_4x using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -2829,9 +2829,9 @@ static void BM_SM50_device_maximum_minimum_ssrgemm_nt_n_256x64x8_64x16x1_8x4_8x4 using WarpShape = cutlass::gemm::GemmShape<64, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; diff --git a/bench/device/sm50_simt_maximum_minimum_ssrgemm_nt_t.cu b/bench/device/sm50_simt_maximum_minimum_ssrgemm_nt_t.cu index 2127978..0cde15d 100644 --- a/bench/device/sm50_simt_maximum_minimum_ssrgemm_nt_t.cu +++ b/bench/device/sm50_simt_maximum_minimum_ssrgemm_nt_t.cu @@ -29,9 +29,9 @@ static void BM_SM50_device_maximum_minimum_ssrgemm_nt_t_8x32x8_8x32x1_2x4_4x8_1x using WarpShape = cutlass::gemm::GemmShape<8, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename 
cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -79,9 +79,9 @@ static void BM_SM50_device_maximum_minimum_ssrgemm_nt_t_16x32x8_16x32x1_4x4_4x8_ using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -129,9 +129,9 @@ static void BM_SM50_device_maximum_minimum_ssrgemm_nt_t_16x64x8_16x64x1_4x8_4x8_ using WarpShape = cutlass::gemm::GemmShape<16, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -179,9 +179,9 @@ static void BM_SM50_device_maximum_minimum_ssrgemm_nt_t_32x32x8_32x32x1_8x4_4x8_ using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + 
precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -229,9 +229,9 @@ static void BM_SM50_device_maximum_minimum_ssrgemm_nt_t_32x64x8_32x64x1_8x8_4x8_ using WarpShape = cutlass::gemm::GemmShape<32, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -279,9 +279,9 @@ static void BM_SM50_device_maximum_minimum_ssrgemm_nt_t_64x32x8_64x32x1_8x8_8x4_ using WarpShape = cutlass::gemm::GemmShape<64, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -329,9 +329,9 @@ static void BM_SM50_device_maximum_minimum_ssrgemm_nt_t_8x32x8_8x16x1_2x2_4x8_1x using WarpShape = cutlass::gemm::GemmShape<8, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + 
cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -379,9 +379,9 @@ static void BM_SM50_device_maximum_minimum_ssrgemm_nt_t_8x64x8_8x32x1_2x4_4x8_1x using WarpShape = cutlass::gemm::GemmShape<8, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -429,9 +429,9 @@ static void BM_SM50_device_maximum_minimum_ssrgemm_nt_t_16x32x8_16x16x1_4x2_4x8_ using WarpShape = cutlass::gemm::GemmShape<16, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -479,9 +479,9 @@ static void BM_SM50_device_maximum_minimum_ssrgemm_nt_t_16x64x8_16x32x1_4x4_4x8_ using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using 
AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -529,9 +529,9 @@ static void BM_SM50_device_maximum_minimum_ssrgemm_nt_t_16x128x8_16x64x1_4x8_4x8 using WarpShape = cutlass::gemm::GemmShape<16, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -579,9 +579,9 @@ static void BM_SM50_device_maximum_minimum_ssrgemm_nt_t_32x32x8_32x16x1_4x4_8x4_ using WarpShape = cutlass::gemm::GemmShape<32, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -629,9 +629,9 @@ static void BM_SM50_device_maximum_minimum_ssrgemm_nt_t_32x64x8_32x32x1_8x4_4x8_ using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = 
Config::MultiplicationOp; @@ -679,9 +679,9 @@ static void BM_SM50_device_maximum_minimum_ssrgemm_nt_t_32x128x8_32x64x1_8x8_4x8 using WarpShape = cutlass::gemm::GemmShape<32, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -729,9 +729,9 @@ static void BM_SM50_device_maximum_minimum_ssrgemm_nt_t_64x64x8_64x32x1_8x8_8x4_ using WarpShape = cutlass::gemm::GemmShape<64, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -779,9 +779,9 @@ static void BM_SM50_device_maximum_minimum_ssrgemm_nt_t_32x32x8_16x32x1_4x4_4x8_ using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -829,9 +829,9 @@ static void 
BM_SM50_device_maximum_minimum_ssrgemm_nt_t_64x32x8_32x32x1_8x4_4x8_ using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -879,9 +879,9 @@ static void BM_SM50_device_maximum_minimum_ssrgemm_nt_t_64x64x8_32x64x1_8x8_4x8_ using WarpShape = cutlass::gemm::GemmShape<32, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -929,9 +929,9 @@ static void BM_SM50_device_maximum_minimum_ssrgemm_nt_t_128x32x8_64x32x1_8x8_8x4 using WarpShape = cutlass::gemm::GemmShape<64, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -979,9 +979,9 @@ static void 
BM_SM50_device_maximum_minimum_ssrgemm_nt_t_16x32x8_8x16x1_2x2_4x8_2 using WarpShape = cutlass::gemm::GemmShape<8, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1029,9 +1029,9 @@ static void BM_SM50_device_maximum_minimum_ssrgemm_nt_t_16x64x8_8x32x1_2x4_4x8_2 using WarpShape = cutlass::gemm::GemmShape<8, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1079,9 +1079,9 @@ static void BM_SM50_device_maximum_minimum_ssrgemm_nt_t_32x32x8_16x16x1_4x2_4x8_ using WarpShape = cutlass::gemm::GemmShape<16, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1129,9 +1129,9 @@ static void 
BM_SM50_device_maximum_minimum_ssrgemm_nt_t_32x64x8_16x32x1_4x4_4x8_ using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1179,9 +1179,9 @@ static void BM_SM50_device_maximum_minimum_ssrgemm_nt_t_32x128x8_16x64x1_4x8_4x8 using WarpShape = cutlass::gemm::GemmShape<16, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1229,9 +1229,9 @@ static void BM_SM50_device_maximum_minimum_ssrgemm_nt_t_64x32x8_32x16x1_4x4_8x4_ using WarpShape = cutlass::gemm::GemmShape<32, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1279,9 +1279,9 @@ static void 
BM_SM50_device_maximum_minimum_ssrgemm_nt_t_64x64x8_32x32x1_8x4_4x8_ using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1329,9 +1329,9 @@ static void BM_SM50_device_maximum_minimum_ssrgemm_nt_t_64x128x8_32x64x1_8x8_4x8 using WarpShape = cutlass::gemm::GemmShape<32, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1379,9 +1379,9 @@ static void BM_SM50_device_maximum_minimum_ssrgemm_nt_t_128x32x8_64x16x1_8x4_8x4 using WarpShape = cutlass::gemm::GemmShape<64, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1429,9 +1429,9 @@ static void 
BM_SM50_device_maximum_minimum_ssrgemm_nt_t_128x64x8_64x32x1_8x8_8x4 using WarpShape = cutlass::gemm::GemmShape<64, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1479,9 +1479,9 @@ static void BM_SM50_device_maximum_minimum_ssrgemm_nt_t_16x64x16_8x16x1_2x2_4x8_ using WarpShape = cutlass::gemm::GemmShape<8, 16, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1529,9 +1529,9 @@ static void BM_SM50_device_maximum_minimum_ssrgemm_nt_t_16x128x16_8x32x1_2x4_4x8 using WarpShape = cutlass::gemm::GemmShape<8, 32, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1579,9 +1579,9 @@ static void 
BM_SM50_device_maximum_minimum_ssrgemm_nt_t_32x32x8_16x8x1_2x2_8x4_2 using WarpShape = cutlass::gemm::GemmShape<16, 8, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1629,9 +1629,9 @@ static void BM_SM50_device_maximum_minimum_ssrgemm_nt_t_32x64x8_16x16x1_4x2_4x8_ using WarpShape = cutlass::gemm::GemmShape<16, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1679,9 +1679,9 @@ static void BM_SM50_device_maximum_minimum_ssrgemm_nt_t_32x128x8_16x32x1_4x4_4x8 using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1729,9 +1729,9 @@ static void 
BM_SM50_device_maximum_minimum_ssrgemm_nt_t_32x256x8_16x64x1_4x8_4x8 using WarpShape = cutlass::gemm::GemmShape<16, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1779,9 +1779,9 @@ static void BM_SM50_device_maximum_minimum_ssrgemm_nt_t_64x64x8_32x16x1_4x4_8x4_ using WarpShape = cutlass::gemm::GemmShape<32, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1829,9 +1829,9 @@ static void BM_SM50_device_maximum_minimum_ssrgemm_nt_t_64x128x8_32x32x1_8x4_4x8 using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1879,9 +1879,9 @@ static void 
BM_SM50_device_maximum_minimum_ssrgemm_nt_t_64x256x8_32x64x1_8x8_4x8 using WarpShape = cutlass::gemm::GemmShape<32, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1929,9 +1929,9 @@ static void BM_SM50_device_maximum_minimum_ssrgemm_nt_t_128x128x8_64x32x1_8x8_8x using WarpShape = cutlass::gemm::GemmShape<64, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1979,9 +1979,9 @@ static void BM_SM50_device_maximum_minimum_ssrgemm_nt_t_32x32x8_8x16x1_2x2_4x8_4 using WarpShape = cutlass::gemm::GemmShape<8, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -2029,9 +2029,9 @@ static void 
BM_SM50_device_maximum_minimum_ssrgemm_nt_t_64x32x8_16x16x1_4x2_4x8_ using WarpShape = cutlass::gemm::GemmShape<16, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -2079,9 +2079,9 @@ static void BM_SM50_device_maximum_minimum_ssrgemm_nt_t_64x64x8_16x32x1_4x4_4x8_ using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -2129,9 +2129,9 @@ static void BM_SM50_device_maximum_minimum_ssrgemm_nt_t_128x32x8_32x16x1_4x4_8x4 using WarpShape = cutlass::gemm::GemmShape<32, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -2179,9 +2179,9 @@ static void 
BM_SM50_device_maximum_minimum_ssrgemm_nt_t_128x64x8_32x32x1_8x4_4x8 using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -2229,9 +2229,9 @@ static void BM_SM50_device_maximum_minimum_ssrgemm_nt_t_128x128x8_32x64x1_8x8_4x using WarpShape = cutlass::gemm::GemmShape<32, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -2279,9 +2279,9 @@ static void BM_SM50_device_maximum_minimum_ssrgemm_nt_t_256x32x8_64x16x1_8x4_8x4 using WarpShape = cutlass::gemm::GemmShape<64, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -2329,9 +2329,9 @@ static void 
BM_SM50_device_maximum_minimum_ssrgemm_nt_t_256x64x8_64x32x1_8x8_8x4 using WarpShape = cutlass::gemm::GemmShape<64, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -2379,9 +2379,9 @@ static void BM_SM50_device_maximum_minimum_ssrgemm_nt_t_32x64x16_8x16x1_2x2_4x8_ using WarpShape = cutlass::gemm::GemmShape<8, 16, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -2429,9 +2429,9 @@ static void BM_SM50_device_maximum_minimum_ssrgemm_nt_t_32x128x16_8x32x1_2x4_4x8 using WarpShape = cutlass::gemm::GemmShape<8, 32, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -2479,9 +2479,9 @@ static void 
BM_SM50_device_maximum_minimum_ssrgemm_nt_t_64x32x16_16x8x1_2x2_8x4_ using WarpShape = cutlass::gemm::GemmShape<16, 8, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -2529,9 +2529,9 @@ static void BM_SM50_device_maximum_minimum_ssrgemm_nt_t_64x64x8_16x16x1_4x2_4x8_ using WarpShape = cutlass::gemm::GemmShape<16, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -2579,9 +2579,9 @@ static void BM_SM50_device_maximum_minimum_ssrgemm_nt_t_64x128x8_16x32x1_4x4_4x8 using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -2629,9 +2629,9 @@ static void 
BM_SM50_device_maximum_minimum_ssrgemm_nt_t_64x256x8_16x64x1_4x8_4x8 using WarpShape = cutlass::gemm::GemmShape<16, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -2679,9 +2679,9 @@ static void BM_SM50_device_maximum_minimum_ssrgemm_nt_t_128x32x16_32x8x1_4x2_8x4 using WarpShape = cutlass::gemm::GemmShape<32, 8, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -2729,9 +2729,9 @@ static void BM_SM50_device_maximum_minimum_ssrgemm_nt_t_128x64x8_32x16x1_4x4_8x4 using WarpShape = cutlass::gemm::GemmShape<32, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -2779,9 +2779,9 @@ static void 
BM_SM50_device_maximum_minimum_ssrgemm_nt_t_128x128x8_32x32x1_8x4_4x using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -2829,9 +2829,9 @@ static void BM_SM50_device_maximum_minimum_ssrgemm_nt_t_256x64x8_64x16x1_8x4_8x4 using WarpShape = cutlass::gemm::GemmShape<64, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; diff --git a/bench/device/sm50_simt_maximum_minimum_ssrgemm_tn_n.cu b/bench/device/sm50_simt_maximum_minimum_ssrgemm_tn_n.cu index ab4bf33..da5b1ce 100644 --- a/bench/device/sm50_simt_maximum_minimum_ssrgemm_tn_n.cu +++ b/bench/device/sm50_simt_maximum_minimum_ssrgemm_tn_n.cu @@ -29,9 +29,9 @@ static void BM_SM50_device_maximum_minimum_ssrgemm_tn_n_8x32x8_8x32x1_2x4_4x8_1x using WarpShape = cutlass::gemm::GemmShape<8, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename 
cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -79,9 +79,9 @@ static void BM_SM50_device_maximum_minimum_ssrgemm_tn_n_16x32x8_16x32x1_4x4_4x8_ using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -129,9 +129,9 @@ static void BM_SM50_device_maximum_minimum_ssrgemm_tn_n_16x64x8_16x64x1_4x8_4x8_ using WarpShape = cutlass::gemm::GemmShape<16, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -179,9 +179,9 @@ static void BM_SM50_device_maximum_minimum_ssrgemm_tn_n_32x32x8_32x32x1_8x4_4x8_ using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + 
precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -229,9 +229,9 @@ static void BM_SM50_device_maximum_minimum_ssrgemm_tn_n_32x64x8_32x64x1_8x8_4x8_ using WarpShape = cutlass::gemm::GemmShape<32, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -279,9 +279,9 @@ static void BM_SM50_device_maximum_minimum_ssrgemm_tn_n_64x32x8_64x32x1_8x8_8x4_ using WarpShape = cutlass::gemm::GemmShape<64, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -329,9 +329,9 @@ static void BM_SM50_device_maximum_minimum_ssrgemm_tn_n_8x32x8_8x16x1_2x2_4x8_1x using WarpShape = cutlass::gemm::GemmShape<8, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + 
cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -379,9 +379,9 @@ static void BM_SM50_device_maximum_minimum_ssrgemm_tn_n_8x64x8_8x32x1_2x4_4x8_1x using WarpShape = cutlass::gemm::GemmShape<8, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -429,9 +429,9 @@ static void BM_SM50_device_maximum_minimum_ssrgemm_tn_n_16x32x8_16x16x1_4x2_4x8_ using WarpShape = cutlass::gemm::GemmShape<16, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -479,9 +479,9 @@ static void BM_SM50_device_maximum_minimum_ssrgemm_tn_n_16x64x8_16x32x1_4x4_4x8_ using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using 
AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -529,9 +529,9 @@ static void BM_SM50_device_maximum_minimum_ssrgemm_tn_n_16x128x8_16x64x1_4x8_4x8 using WarpShape = cutlass::gemm::GemmShape<16, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -579,9 +579,9 @@ static void BM_SM50_device_maximum_minimum_ssrgemm_tn_n_32x32x8_32x16x1_4x4_8x4_ using WarpShape = cutlass::gemm::GemmShape<32, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -629,9 +629,9 @@ static void BM_SM50_device_maximum_minimum_ssrgemm_tn_n_32x64x8_32x32x1_8x4_4x8_ using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = 
Config::MultiplicationOp; @@ -679,9 +679,9 @@ static void BM_SM50_device_maximum_minimum_ssrgemm_tn_n_32x128x8_32x64x1_8x8_4x8 using WarpShape = cutlass::gemm::GemmShape<32, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -729,9 +729,9 @@ static void BM_SM50_device_maximum_minimum_ssrgemm_tn_n_64x64x8_64x32x1_8x8_8x4_ using WarpShape = cutlass::gemm::GemmShape<64, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -779,9 +779,9 @@ static void BM_SM50_device_maximum_minimum_ssrgemm_tn_n_32x32x8_16x32x1_4x4_4x8_ using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -829,9 +829,9 @@ static void 
BM_SM50_device_maximum_minimum_ssrgemm_tn_n_64x32x8_32x32x1_8x4_4x8_ using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -879,9 +879,9 @@ static void BM_SM50_device_maximum_minimum_ssrgemm_tn_n_64x64x8_32x64x1_8x8_4x8_ using WarpShape = cutlass::gemm::GemmShape<32, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -929,9 +929,9 @@ static void BM_SM50_device_maximum_minimum_ssrgemm_tn_n_128x32x8_64x32x1_8x8_8x4 using WarpShape = cutlass::gemm::GemmShape<64, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -979,9 +979,9 @@ static void 
BM_SM50_device_maximum_minimum_ssrgemm_tn_n_16x32x8_8x16x1_2x2_4x8_2 using WarpShape = cutlass::gemm::GemmShape<8, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1029,9 +1029,9 @@ static void BM_SM50_device_maximum_minimum_ssrgemm_tn_n_16x64x8_8x32x1_2x4_4x8_2 using WarpShape = cutlass::gemm::GemmShape<8, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1079,9 +1079,9 @@ static void BM_SM50_device_maximum_minimum_ssrgemm_tn_n_32x32x8_16x16x1_4x2_4x8_ using WarpShape = cutlass::gemm::GemmShape<16, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1129,9 +1129,9 @@ static void 
BM_SM50_device_maximum_minimum_ssrgemm_tn_n_32x64x8_16x32x1_4x4_4x8_ using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1179,9 +1179,9 @@ static void BM_SM50_device_maximum_minimum_ssrgemm_tn_n_32x128x8_16x64x1_4x8_4x8 using WarpShape = cutlass::gemm::GemmShape<16, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1229,9 +1229,9 @@ static void BM_SM50_device_maximum_minimum_ssrgemm_tn_n_64x32x8_32x16x1_4x4_8x4_ using WarpShape = cutlass::gemm::GemmShape<32, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1279,9 +1279,9 @@ static void 
BM_SM50_device_maximum_minimum_ssrgemm_tn_n_64x64x8_32x32x1_8x4_4x8_ using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1329,9 +1329,9 @@ static void BM_SM50_device_maximum_minimum_ssrgemm_tn_n_64x128x8_32x64x1_8x8_4x8 using WarpShape = cutlass::gemm::GemmShape<32, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1379,9 +1379,9 @@ static void BM_SM50_device_maximum_minimum_ssrgemm_tn_n_128x32x8_64x16x1_8x4_8x4 using WarpShape = cutlass::gemm::GemmShape<64, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1429,9 +1429,9 @@ static void 
BM_SM50_device_maximum_minimum_ssrgemm_tn_n_128x64x8_64x32x1_8x8_8x4 using WarpShape = cutlass::gemm::GemmShape<64, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1479,9 +1479,9 @@ static void BM_SM50_device_maximum_minimum_ssrgemm_tn_n_16x64x16_8x16x1_2x2_4x8_ using WarpShape = cutlass::gemm::GemmShape<8, 16, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1529,9 +1529,9 @@ static void BM_SM50_device_maximum_minimum_ssrgemm_tn_n_16x128x16_8x32x1_2x4_4x8 using WarpShape = cutlass::gemm::GemmShape<8, 32, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1579,9 +1579,9 @@ static void 
BM_SM50_device_maximum_minimum_ssrgemm_tn_n_32x32x8_16x8x1_2x2_8x4_2 using WarpShape = cutlass::gemm::GemmShape<16, 8, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1629,9 +1629,9 @@ static void BM_SM50_device_maximum_minimum_ssrgemm_tn_n_32x64x8_16x16x1_4x2_4x8_ using WarpShape = cutlass::gemm::GemmShape<16, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1679,9 +1679,9 @@ static void BM_SM50_device_maximum_minimum_ssrgemm_tn_n_32x128x8_16x32x1_4x4_4x8 using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1729,9 +1729,9 @@ static void 
BM_SM50_device_maximum_minimum_ssrgemm_tn_n_32x256x8_16x64x1_4x8_4x8 using WarpShape = cutlass::gemm::GemmShape<16, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1779,9 +1779,9 @@ static void BM_SM50_device_maximum_minimum_ssrgemm_tn_n_64x64x8_32x16x1_4x4_8x4_ using WarpShape = cutlass::gemm::GemmShape<32, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1829,9 +1829,9 @@ static void BM_SM50_device_maximum_minimum_ssrgemm_tn_n_64x128x8_32x32x1_8x4_4x8 using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1879,9 +1879,9 @@ static void 
BM_SM50_device_maximum_minimum_ssrgemm_tn_n_64x256x8_32x64x1_8x8_4x8 using WarpShape = cutlass::gemm::GemmShape<32, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1929,9 +1929,9 @@ static void BM_SM50_device_maximum_minimum_ssrgemm_tn_n_128x128x8_64x32x1_8x8_8x using WarpShape = cutlass::gemm::GemmShape<64, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1979,9 +1979,9 @@ static void BM_SM50_device_maximum_minimum_ssrgemm_tn_n_32x32x8_8x16x1_2x2_4x8_4 using WarpShape = cutlass::gemm::GemmShape<8, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -2029,9 +2029,9 @@ static void 
BM_SM50_device_maximum_minimum_ssrgemm_tn_n_64x32x8_16x16x1_4x2_4x8_ using WarpShape = cutlass::gemm::GemmShape<16, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -2079,9 +2079,9 @@ static void BM_SM50_device_maximum_minimum_ssrgemm_tn_n_64x64x8_16x32x1_4x4_4x8_ using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -2129,9 +2129,9 @@ static void BM_SM50_device_maximum_minimum_ssrgemm_tn_n_128x32x8_32x16x1_4x4_8x4 using WarpShape = cutlass::gemm::GemmShape<32, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -2179,9 +2179,9 @@ static void 
BM_SM50_device_maximum_minimum_ssrgemm_tn_n_128x64x8_32x32x1_8x4_4x8 using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -2229,9 +2229,9 @@ static void BM_SM50_device_maximum_minimum_ssrgemm_tn_n_128x128x8_32x64x1_8x8_4x using WarpShape = cutlass::gemm::GemmShape<32, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -2279,9 +2279,9 @@ static void BM_SM50_device_maximum_minimum_ssrgemm_tn_n_256x32x8_64x16x1_8x4_8x4 using WarpShape = cutlass::gemm::GemmShape<64, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -2329,9 +2329,9 @@ static void 
BM_SM50_device_maximum_minimum_ssrgemm_tn_n_256x64x8_64x32x1_8x8_8x4 using WarpShape = cutlass::gemm::GemmShape<64, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -2379,9 +2379,9 @@ static void BM_SM50_device_maximum_minimum_ssrgemm_tn_n_32x64x16_8x16x1_2x2_4x8_ using WarpShape = cutlass::gemm::GemmShape<8, 16, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -2429,9 +2429,9 @@ static void BM_SM50_device_maximum_minimum_ssrgemm_tn_n_32x128x16_8x32x1_2x4_4x8 using WarpShape = cutlass::gemm::GemmShape<8, 32, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -2479,9 +2479,9 @@ static void 
BM_SM50_device_maximum_minimum_ssrgemm_tn_n_64x32x16_16x8x1_2x2_8x4_ using WarpShape = cutlass::gemm::GemmShape<16, 8, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -2529,9 +2529,9 @@ static void BM_SM50_device_maximum_minimum_ssrgemm_tn_n_64x64x8_16x16x1_4x2_4x8_ using WarpShape = cutlass::gemm::GemmShape<16, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -2579,9 +2579,9 @@ static void BM_SM50_device_maximum_minimum_ssrgemm_tn_n_64x128x8_16x32x1_4x4_4x8 using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -2629,9 +2629,9 @@ static void 
BM_SM50_device_maximum_minimum_ssrgemm_tn_n_64x256x8_16x64x1_4x8_4x8 using WarpShape = cutlass::gemm::GemmShape<16, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -2679,9 +2679,9 @@ static void BM_SM50_device_maximum_minimum_ssrgemm_tn_n_128x32x16_32x8x1_4x2_8x4 using WarpShape = cutlass::gemm::GemmShape<32, 8, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -2729,9 +2729,9 @@ static void BM_SM50_device_maximum_minimum_ssrgemm_tn_n_128x64x8_32x16x1_4x4_8x4 using WarpShape = cutlass::gemm::GemmShape<32, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -2779,9 +2779,9 @@ static void 
BM_SM50_device_maximum_minimum_ssrgemm_tn_n_128x128x8_32x32x1_8x4_4x using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -2829,9 +2829,9 @@ static void BM_SM50_device_maximum_minimum_ssrgemm_tn_n_256x64x8_64x16x1_8x4_8x4 using WarpShape = cutlass::gemm::GemmShape<64, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; diff --git a/bench/device/sm50_simt_maximum_minimum_ssrgemm_tn_t.cu b/bench/device/sm50_simt_maximum_minimum_ssrgemm_tn_t.cu index 428979a..5191e74 100644 --- a/bench/device/sm50_simt_maximum_minimum_ssrgemm_tn_t.cu +++ b/bench/device/sm50_simt_maximum_minimum_ssrgemm_tn_t.cu @@ -29,9 +29,9 @@ static void BM_SM50_device_maximum_minimum_ssrgemm_tn_t_8x32x8_8x32x1_2x4_4x8_1x using WarpShape = cutlass::gemm::GemmShape<8, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename 
cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -79,9 +79,9 @@ static void BM_SM50_device_maximum_minimum_ssrgemm_tn_t_16x32x8_16x32x1_4x4_4x8_ using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -129,9 +129,9 @@ static void BM_SM50_device_maximum_minimum_ssrgemm_tn_t_16x64x8_16x64x1_4x8_4x8_ using WarpShape = cutlass::gemm::GemmShape<16, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -179,9 +179,9 @@ static void BM_SM50_device_maximum_minimum_ssrgemm_tn_t_32x32x8_32x32x1_8x4_4x8_ using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + 
precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -229,9 +229,9 @@ static void BM_SM50_device_maximum_minimum_ssrgemm_tn_t_32x64x8_32x64x1_8x8_4x8_ using WarpShape = cutlass::gemm::GemmShape<32, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -279,9 +279,9 @@ static void BM_SM50_device_maximum_minimum_ssrgemm_tn_t_64x32x8_64x32x1_8x8_8x4_ using WarpShape = cutlass::gemm::GemmShape<64, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -329,9 +329,9 @@ static void BM_SM50_device_maximum_minimum_ssrgemm_tn_t_8x32x8_8x16x1_2x2_4x8_1x using WarpShape = cutlass::gemm::GemmShape<8, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + 
cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -379,9 +379,9 @@ static void BM_SM50_device_maximum_minimum_ssrgemm_tn_t_8x64x8_8x32x1_2x4_4x8_1x using WarpShape = cutlass::gemm::GemmShape<8, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -429,9 +429,9 @@ static void BM_SM50_device_maximum_minimum_ssrgemm_tn_t_16x32x8_16x16x1_4x2_4x8_ using WarpShape = cutlass::gemm::GemmShape<16, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -479,9 +479,9 @@ static void BM_SM50_device_maximum_minimum_ssrgemm_tn_t_16x64x8_16x32x1_4x4_4x8_ using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using 
AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -529,9 +529,9 @@ static void BM_SM50_device_maximum_minimum_ssrgemm_tn_t_16x128x8_16x64x1_4x8_4x8 using WarpShape = cutlass::gemm::GemmShape<16, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -579,9 +579,9 @@ static void BM_SM50_device_maximum_minimum_ssrgemm_tn_t_32x32x8_32x16x1_4x4_8x4_ using WarpShape = cutlass::gemm::GemmShape<32, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -629,9 +629,9 @@ static void BM_SM50_device_maximum_minimum_ssrgemm_tn_t_32x64x8_32x32x1_8x4_4x8_ using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = 
Config::MultiplicationOp; @@ -679,9 +679,9 @@ static void BM_SM50_device_maximum_minimum_ssrgemm_tn_t_32x128x8_32x64x1_8x8_4x8 using WarpShape = cutlass::gemm::GemmShape<32, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -729,9 +729,9 @@ static void BM_SM50_device_maximum_minimum_ssrgemm_tn_t_64x64x8_64x32x1_8x8_8x4_ using WarpShape = cutlass::gemm::GemmShape<64, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -779,9 +779,9 @@ static void BM_SM50_device_maximum_minimum_ssrgemm_tn_t_32x32x8_16x32x1_4x4_4x8_ using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -829,9 +829,9 @@ static void 
BM_SM50_device_maximum_minimum_ssrgemm_tn_t_64x32x8_32x32x1_8x4_4x8_ using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -879,9 +879,9 @@ static void BM_SM50_device_maximum_minimum_ssrgemm_tn_t_64x64x8_32x64x1_8x8_4x8_ using WarpShape = cutlass::gemm::GemmShape<32, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -929,9 +929,9 @@ static void BM_SM50_device_maximum_minimum_ssrgemm_tn_t_128x32x8_64x32x1_8x8_8x4 using WarpShape = cutlass::gemm::GemmShape<64, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -979,9 +979,9 @@ static void 
BM_SM50_device_maximum_minimum_ssrgemm_tn_t_16x32x8_8x16x1_2x2_4x8_2 using WarpShape = cutlass::gemm::GemmShape<8, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1029,9 +1029,9 @@ static void BM_SM50_device_maximum_minimum_ssrgemm_tn_t_16x64x8_8x32x1_2x4_4x8_2 using WarpShape = cutlass::gemm::GemmShape<8, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1079,9 +1079,9 @@ static void BM_SM50_device_maximum_minimum_ssrgemm_tn_t_32x32x8_16x16x1_4x2_4x8_ using WarpShape = cutlass::gemm::GemmShape<16, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1129,9 +1129,9 @@ static void 
BM_SM50_device_maximum_minimum_ssrgemm_tn_t_32x64x8_16x32x1_4x4_4x8_ using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1179,9 +1179,9 @@ static void BM_SM50_device_maximum_minimum_ssrgemm_tn_t_32x128x8_16x64x1_4x8_4x8 using WarpShape = cutlass::gemm::GemmShape<16, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1229,9 +1229,9 @@ static void BM_SM50_device_maximum_minimum_ssrgemm_tn_t_64x32x8_32x16x1_4x4_8x4_ using WarpShape = cutlass::gemm::GemmShape<32, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1279,9 +1279,9 @@ static void 
BM_SM50_device_maximum_minimum_ssrgemm_tn_t_64x64x8_32x32x1_8x4_4x8_ using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1329,9 +1329,9 @@ static void BM_SM50_device_maximum_minimum_ssrgemm_tn_t_64x128x8_32x64x1_8x8_4x8 using WarpShape = cutlass::gemm::GemmShape<32, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1379,9 +1379,9 @@ static void BM_SM50_device_maximum_minimum_ssrgemm_tn_t_128x32x8_64x16x1_8x4_8x4 using WarpShape = cutlass::gemm::GemmShape<64, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1429,9 +1429,9 @@ static void 
BM_SM50_device_maximum_minimum_ssrgemm_tn_t_128x64x8_64x32x1_8x8_8x4 using WarpShape = cutlass::gemm::GemmShape<64, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1479,9 +1479,9 @@ static void BM_SM50_device_maximum_minimum_ssrgemm_tn_t_16x64x16_8x16x1_2x2_4x8_ using WarpShape = cutlass::gemm::GemmShape<8, 16, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1529,9 +1529,9 @@ static void BM_SM50_device_maximum_minimum_ssrgemm_tn_t_16x128x16_8x32x1_2x4_4x8 using WarpShape = cutlass::gemm::GemmShape<8, 32, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1579,9 +1579,9 @@ static void 
BM_SM50_device_maximum_minimum_ssrgemm_tn_t_32x32x8_16x8x1_2x2_8x4_2 using WarpShape = cutlass::gemm::GemmShape<16, 8, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1629,9 +1629,9 @@ static void BM_SM50_device_maximum_minimum_ssrgemm_tn_t_32x64x8_16x16x1_4x2_4x8_ using WarpShape = cutlass::gemm::GemmShape<16, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1679,9 +1679,9 @@ static void BM_SM50_device_maximum_minimum_ssrgemm_tn_t_32x128x8_16x32x1_4x4_4x8 using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1729,9 +1729,9 @@ static void 
BM_SM50_device_maximum_minimum_ssrgemm_tn_t_32x256x8_16x64x1_4x8_4x8 using WarpShape = cutlass::gemm::GemmShape<16, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1779,9 +1779,9 @@ static void BM_SM50_device_maximum_minimum_ssrgemm_tn_t_64x64x8_32x16x1_4x4_8x4_ using WarpShape = cutlass::gemm::GemmShape<32, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1829,9 +1829,9 @@ static void BM_SM50_device_maximum_minimum_ssrgemm_tn_t_64x128x8_32x32x1_8x4_4x8 using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1879,9 +1879,9 @@ static void 
BM_SM50_device_maximum_minimum_ssrgemm_tn_t_64x256x8_32x64x1_8x8_4x8 using WarpShape = cutlass::gemm::GemmShape<32, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1929,9 +1929,9 @@ static void BM_SM50_device_maximum_minimum_ssrgemm_tn_t_128x128x8_64x32x1_8x8_8x using WarpShape = cutlass::gemm::GemmShape<64, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1979,9 +1979,9 @@ static void BM_SM50_device_maximum_minimum_ssrgemm_tn_t_32x32x8_8x16x1_2x2_4x8_4 using WarpShape = cutlass::gemm::GemmShape<8, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -2029,9 +2029,9 @@ static void 
BM_SM50_device_maximum_minimum_ssrgemm_tn_t_64x32x8_16x16x1_4x2_4x8_ using WarpShape = cutlass::gemm::GemmShape<16, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -2079,9 +2079,9 @@ static void BM_SM50_device_maximum_minimum_ssrgemm_tn_t_64x64x8_16x32x1_4x4_4x8_ using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -2129,9 +2129,9 @@ static void BM_SM50_device_maximum_minimum_ssrgemm_tn_t_128x32x8_32x16x1_4x4_8x4 using WarpShape = cutlass::gemm::GemmShape<32, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -2179,9 +2179,9 @@ static void 
BM_SM50_device_maximum_minimum_ssrgemm_tn_t_128x64x8_32x32x1_8x4_4x8 using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -2229,9 +2229,9 @@ static void BM_SM50_device_maximum_minimum_ssrgemm_tn_t_128x128x8_32x64x1_8x8_4x using WarpShape = cutlass::gemm::GemmShape<32, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -2279,9 +2279,9 @@ static void BM_SM50_device_maximum_minimum_ssrgemm_tn_t_256x32x8_64x16x1_8x4_8x4 using WarpShape = cutlass::gemm::GemmShape<64, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -2329,9 +2329,9 @@ static void 
BM_SM50_device_maximum_minimum_ssrgemm_tn_t_256x64x8_64x32x1_8x8_8x4 using WarpShape = cutlass::gemm::GemmShape<64, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -2379,9 +2379,9 @@ static void BM_SM50_device_maximum_minimum_ssrgemm_tn_t_32x64x16_8x16x1_2x2_4x8_ using WarpShape = cutlass::gemm::GemmShape<8, 16, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -2429,9 +2429,9 @@ static void BM_SM50_device_maximum_minimum_ssrgemm_tn_t_32x128x16_8x32x1_2x4_4x8 using WarpShape = cutlass::gemm::GemmShape<8, 32, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -2479,9 +2479,9 @@ static void 
BM_SM50_device_maximum_minimum_ssrgemm_tn_t_64x32x16_16x8x1_2x2_8x4_ using WarpShape = cutlass::gemm::GemmShape<16, 8, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -2529,9 +2529,9 @@ static void BM_SM50_device_maximum_minimum_ssrgemm_tn_t_64x64x8_16x16x1_4x2_4x8_ using WarpShape = cutlass::gemm::GemmShape<16, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -2579,9 +2579,9 @@ static void BM_SM50_device_maximum_minimum_ssrgemm_tn_t_64x128x8_16x32x1_4x4_4x8 using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -2629,9 +2629,9 @@ static void 
BM_SM50_device_maximum_minimum_ssrgemm_tn_t_64x256x8_16x64x1_4x8_4x8 using WarpShape = cutlass::gemm::GemmShape<16, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -2679,9 +2679,9 @@ static void BM_SM50_device_maximum_minimum_ssrgemm_tn_t_128x32x16_32x8x1_4x2_8x4 using WarpShape = cutlass::gemm::GemmShape<32, 8, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -2729,9 +2729,9 @@ static void BM_SM50_device_maximum_minimum_ssrgemm_tn_t_128x64x8_32x16x1_4x4_8x4 using WarpShape = cutlass::gemm::GemmShape<32, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -2779,9 +2779,9 @@ static void 
BM_SM50_device_maximum_minimum_ssrgemm_tn_t_128x128x8_32x32x1_8x4_4x using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -2829,9 +2829,9 @@ static void BM_SM50_device_maximum_minimum_ssrgemm_tn_t_256x64x8_64x16x1_8x4_8x4 using WarpShape = cutlass::gemm::GemmShape<64, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; diff --git a/bench/device/sm50_simt_maximum_minimum_ssrgemm_tt_n.cu b/bench/device/sm50_simt_maximum_minimum_ssrgemm_tt_n.cu index 2a27f44..82f46f0 100644 --- a/bench/device/sm50_simt_maximum_minimum_ssrgemm_tt_n.cu +++ b/bench/device/sm50_simt_maximum_minimum_ssrgemm_tt_n.cu @@ -29,9 +29,9 @@ static void BM_SM50_device_maximum_minimum_ssrgemm_tt_n_8x32x8_8x32x1_2x4_4x8_1x using WarpShape = cutlass::gemm::GemmShape<8, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename 
cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -79,9 +79,9 @@ static void BM_SM50_device_maximum_minimum_ssrgemm_tt_n_16x32x8_16x32x1_4x4_4x8_ using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -129,9 +129,9 @@ static void BM_SM50_device_maximum_minimum_ssrgemm_tt_n_16x64x8_16x64x1_4x8_4x8_ using WarpShape = cutlass::gemm::GemmShape<16, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -179,9 +179,9 @@ static void BM_SM50_device_maximum_minimum_ssrgemm_tt_n_32x32x8_32x32x1_8x4_4x8_ using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + 
precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -229,9 +229,9 @@ static void BM_SM50_device_maximum_minimum_ssrgemm_tt_n_32x64x8_32x64x1_8x8_4x8_ using WarpShape = cutlass::gemm::GemmShape<32, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -279,9 +279,9 @@ static void BM_SM50_device_maximum_minimum_ssrgemm_tt_n_64x32x8_64x32x1_8x8_8x4_ using WarpShape = cutlass::gemm::GemmShape<64, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -329,9 +329,9 @@ static void BM_SM50_device_maximum_minimum_ssrgemm_tt_n_8x32x8_8x16x1_2x2_4x8_1x using WarpShape = cutlass::gemm::GemmShape<8, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + 
cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -379,9 +379,9 @@ static void BM_SM50_device_maximum_minimum_ssrgemm_tt_n_8x64x8_8x32x1_2x4_4x8_1x using WarpShape = cutlass::gemm::GemmShape<8, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -429,9 +429,9 @@ static void BM_SM50_device_maximum_minimum_ssrgemm_tt_n_16x32x8_16x16x1_4x2_4x8_ using WarpShape = cutlass::gemm::GemmShape<16, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -479,9 +479,9 @@ static void BM_SM50_device_maximum_minimum_ssrgemm_tt_n_16x64x8_16x32x1_4x4_4x8_ using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using 
AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -529,9 +529,9 @@ static void BM_SM50_device_maximum_minimum_ssrgemm_tt_n_16x128x8_16x64x1_4x8_4x8 using WarpShape = cutlass::gemm::GemmShape<16, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -579,9 +579,9 @@ static void BM_SM50_device_maximum_minimum_ssrgemm_tt_n_32x32x8_32x16x1_4x4_8x4_ using WarpShape = cutlass::gemm::GemmShape<32, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -629,9 +629,9 @@ static void BM_SM50_device_maximum_minimum_ssrgemm_tt_n_32x64x8_32x32x1_8x4_4x8_ using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = 
Config::MultiplicationOp; @@ -679,9 +679,9 @@ static void BM_SM50_device_maximum_minimum_ssrgemm_tt_n_32x128x8_32x64x1_8x8_4x8 using WarpShape = cutlass::gemm::GemmShape<32, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -729,9 +729,9 @@ static void BM_SM50_device_maximum_minimum_ssrgemm_tt_n_64x64x8_64x32x1_8x8_8x4_ using WarpShape = cutlass::gemm::GemmShape<64, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -779,9 +779,9 @@ static void BM_SM50_device_maximum_minimum_ssrgemm_tt_n_32x32x8_16x32x1_4x4_4x8_ using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -829,9 +829,9 @@ static void 
BM_SM50_device_maximum_minimum_ssrgemm_tt_n_64x32x8_32x32x1_8x4_4x8_ using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -879,9 +879,9 @@ static void BM_SM50_device_maximum_minimum_ssrgemm_tt_n_64x64x8_32x64x1_8x8_4x8_ using WarpShape = cutlass::gemm::GemmShape<32, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -929,9 +929,9 @@ static void BM_SM50_device_maximum_minimum_ssrgemm_tt_n_128x32x8_64x32x1_8x8_8x4 using WarpShape = cutlass::gemm::GemmShape<64, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -979,9 +979,9 @@ static void 
BM_SM50_device_maximum_minimum_ssrgemm_tt_n_16x32x8_8x16x1_2x2_4x8_2 using WarpShape = cutlass::gemm::GemmShape<8, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1029,9 +1029,9 @@ static void BM_SM50_device_maximum_minimum_ssrgemm_tt_n_16x64x8_8x32x1_2x4_4x8_2 using WarpShape = cutlass::gemm::GemmShape<8, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1079,9 +1079,9 @@ static void BM_SM50_device_maximum_minimum_ssrgemm_tt_n_32x32x8_16x16x1_4x2_4x8_ using WarpShape = cutlass::gemm::GemmShape<16, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1129,9 +1129,9 @@ static void 
BM_SM50_device_maximum_minimum_ssrgemm_tt_n_32x64x8_16x32x1_4x4_4x8_ using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1179,9 +1179,9 @@ static void BM_SM50_device_maximum_minimum_ssrgemm_tt_n_32x128x8_16x64x1_4x8_4x8 using WarpShape = cutlass::gemm::GemmShape<16, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1229,9 +1229,9 @@ static void BM_SM50_device_maximum_minimum_ssrgemm_tt_n_64x32x8_32x16x1_4x4_8x4_ using WarpShape = cutlass::gemm::GemmShape<32, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1279,9 +1279,9 @@ static void 
BM_SM50_device_maximum_minimum_ssrgemm_tt_n_64x64x8_32x32x1_8x4_4x8_ using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1329,9 +1329,9 @@ static void BM_SM50_device_maximum_minimum_ssrgemm_tt_n_64x128x8_32x64x1_8x8_4x8 using WarpShape = cutlass::gemm::GemmShape<32, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1379,9 +1379,9 @@ static void BM_SM50_device_maximum_minimum_ssrgemm_tt_n_128x32x8_64x16x1_8x4_8x4 using WarpShape = cutlass::gemm::GemmShape<64, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1429,9 +1429,9 @@ static void 
BM_SM50_device_maximum_minimum_ssrgemm_tt_n_128x64x8_64x32x1_8x8_8x4 using WarpShape = cutlass::gemm::GemmShape<64, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1479,9 +1479,9 @@ static void BM_SM50_device_maximum_minimum_ssrgemm_tt_n_16x64x16_8x16x1_2x2_4x8_ using WarpShape = cutlass::gemm::GemmShape<8, 16, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1529,9 +1529,9 @@ static void BM_SM50_device_maximum_minimum_ssrgemm_tt_n_16x128x16_8x32x1_2x4_4x8 using WarpShape = cutlass::gemm::GemmShape<8, 32, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1579,9 +1579,9 @@ static void 
BM_SM50_device_maximum_minimum_ssrgemm_tt_n_32x32x8_16x8x1_2x2_8x4_2 using WarpShape = cutlass::gemm::GemmShape<16, 8, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1629,9 +1629,9 @@ static void BM_SM50_device_maximum_minimum_ssrgemm_tt_n_32x64x8_16x16x1_4x2_4x8_ using WarpShape = cutlass::gemm::GemmShape<16, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1679,9 +1679,9 @@ static void BM_SM50_device_maximum_minimum_ssrgemm_tt_n_32x128x8_16x32x1_4x4_4x8 using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1729,9 +1729,9 @@ static void 
BM_SM50_device_maximum_minimum_ssrgemm_tt_n_32x256x8_16x64x1_4x8_4x8 using WarpShape = cutlass::gemm::GemmShape<16, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1779,9 +1779,9 @@ static void BM_SM50_device_maximum_minimum_ssrgemm_tt_n_64x64x8_32x16x1_4x4_8x4_ using WarpShape = cutlass::gemm::GemmShape<32, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1829,9 +1829,9 @@ static void BM_SM50_device_maximum_minimum_ssrgemm_tt_n_64x128x8_32x32x1_8x4_4x8 using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1879,9 +1879,9 @@ static void 
BM_SM50_device_maximum_minimum_ssrgemm_tt_n_64x256x8_32x64x1_8x8_4x8 using WarpShape = cutlass::gemm::GemmShape<32, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1929,9 +1929,9 @@ static void BM_SM50_device_maximum_minimum_ssrgemm_tt_n_128x128x8_64x32x1_8x8_8x using WarpShape = cutlass::gemm::GemmShape<64, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1979,9 +1979,9 @@ static void BM_SM50_device_maximum_minimum_ssrgemm_tt_n_32x32x8_8x16x1_2x2_4x8_4 using WarpShape = cutlass::gemm::GemmShape<8, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -2029,9 +2029,9 @@ static void 
BM_SM50_device_maximum_minimum_ssrgemm_tt_n_64x32x8_16x16x1_4x2_4x8_ using WarpShape = cutlass::gemm::GemmShape<16, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -2079,9 +2079,9 @@ static void BM_SM50_device_maximum_minimum_ssrgemm_tt_n_64x64x8_16x32x1_4x4_4x8_ using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -2129,9 +2129,9 @@ static void BM_SM50_device_maximum_minimum_ssrgemm_tt_n_128x32x8_32x16x1_4x4_8x4 using WarpShape = cutlass::gemm::GemmShape<32, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -2179,9 +2179,9 @@ static void 
BM_SM50_device_maximum_minimum_ssrgemm_tt_n_128x64x8_32x32x1_8x4_4x8 using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -2229,9 +2229,9 @@ static void BM_SM50_device_maximum_minimum_ssrgemm_tt_n_128x128x8_32x64x1_8x8_4x using WarpShape = cutlass::gemm::GemmShape<32, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -2279,9 +2279,9 @@ static void BM_SM50_device_maximum_minimum_ssrgemm_tt_n_256x32x8_64x16x1_8x4_8x4 using WarpShape = cutlass::gemm::GemmShape<64, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -2329,9 +2329,9 @@ static void 
BM_SM50_device_maximum_minimum_ssrgemm_tt_n_256x64x8_64x32x1_8x8_8x4 using WarpShape = cutlass::gemm::GemmShape<64, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -2379,9 +2379,9 @@ static void BM_SM50_device_maximum_minimum_ssrgemm_tt_n_32x64x16_8x16x1_2x2_4x8_ using WarpShape = cutlass::gemm::GemmShape<8, 16, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -2429,9 +2429,9 @@ static void BM_SM50_device_maximum_minimum_ssrgemm_tt_n_32x128x16_8x32x1_2x4_4x8 using WarpShape = cutlass::gemm::GemmShape<8, 32, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -2479,9 +2479,9 @@ static void 
BM_SM50_device_maximum_minimum_ssrgemm_tt_n_64x32x16_16x8x1_2x2_8x4_ using WarpShape = cutlass::gemm::GemmShape<16, 8, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -2529,9 +2529,9 @@ static void BM_SM50_device_maximum_minimum_ssrgemm_tt_n_64x64x8_16x16x1_4x2_4x8_ using WarpShape = cutlass::gemm::GemmShape<16, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -2579,9 +2579,9 @@ static void BM_SM50_device_maximum_minimum_ssrgemm_tt_n_64x128x8_16x32x1_4x4_4x8 using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -2629,9 +2629,9 @@ static void 
BM_SM50_device_maximum_minimum_ssrgemm_tt_n_64x256x8_16x64x1_4x8_4x8 using WarpShape = cutlass::gemm::GemmShape<16, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -2679,9 +2679,9 @@ static void BM_SM50_device_maximum_minimum_ssrgemm_tt_n_128x32x16_32x8x1_4x2_8x4 using WarpShape = cutlass::gemm::GemmShape<32, 8, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -2729,9 +2729,9 @@ static void BM_SM50_device_maximum_minimum_ssrgemm_tt_n_128x64x8_32x16x1_4x4_8x4 using WarpShape = cutlass::gemm::GemmShape<32, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -2779,9 +2779,9 @@ static void 
BM_SM50_device_maximum_minimum_ssrgemm_tt_n_128x128x8_32x32x1_8x4_4x using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -2829,9 +2829,9 @@ static void BM_SM50_device_maximum_minimum_ssrgemm_tt_n_256x64x8_64x16x1_8x4_8x4 using WarpShape = cutlass::gemm::GemmShape<64, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; diff --git a/bench/device/sm50_simt_maximum_minimum_ssrgemm_tt_t.cu b/bench/device/sm50_simt_maximum_minimum_ssrgemm_tt_t.cu index ba34829..3a74dc8 100644 --- a/bench/device/sm50_simt_maximum_minimum_ssrgemm_tt_t.cu +++ b/bench/device/sm50_simt_maximum_minimum_ssrgemm_tt_t.cu @@ -29,9 +29,9 @@ static void BM_SM50_device_maximum_minimum_ssrgemm_tt_t_8x32x8_8x32x1_2x4_4x8_1x using WarpShape = cutlass::gemm::GemmShape<8, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename 
cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -79,9 +79,9 @@ static void BM_SM50_device_maximum_minimum_ssrgemm_tt_t_16x32x8_16x32x1_4x4_4x8_ using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -129,9 +129,9 @@ static void BM_SM50_device_maximum_minimum_ssrgemm_tt_t_16x64x8_16x64x1_4x8_4x8_ using WarpShape = cutlass::gemm::GemmShape<16, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -179,9 +179,9 @@ static void BM_SM50_device_maximum_minimum_ssrgemm_tt_t_32x32x8_32x32x1_8x4_4x8_ using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + 
precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -229,9 +229,9 @@ static void BM_SM50_device_maximum_minimum_ssrgemm_tt_t_32x64x8_32x64x1_8x8_4x8_ using WarpShape = cutlass::gemm::GemmShape<32, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -279,9 +279,9 @@ static void BM_SM50_device_maximum_minimum_ssrgemm_tt_t_64x32x8_64x32x1_8x8_8x4_ using WarpShape = cutlass::gemm::GemmShape<64, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -329,9 +329,9 @@ static void BM_SM50_device_maximum_minimum_ssrgemm_tt_t_8x32x8_8x16x1_2x2_4x8_1x using WarpShape = cutlass::gemm::GemmShape<8, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + 
cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -379,9 +379,9 @@ static void BM_SM50_device_maximum_minimum_ssrgemm_tt_t_8x64x8_8x32x1_2x4_4x8_1x using WarpShape = cutlass::gemm::GemmShape<8, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -429,9 +429,9 @@ static void BM_SM50_device_maximum_minimum_ssrgemm_tt_t_16x32x8_16x16x1_4x2_4x8_ using WarpShape = cutlass::gemm::GemmShape<16, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -479,9 +479,9 @@ static void BM_SM50_device_maximum_minimum_ssrgemm_tt_t_16x64x8_16x32x1_4x4_4x8_ using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using 
AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -529,9 +529,9 @@ static void BM_SM50_device_maximum_minimum_ssrgemm_tt_t_16x128x8_16x64x1_4x8_4x8 using WarpShape = cutlass::gemm::GemmShape<16, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -579,9 +579,9 @@ static void BM_SM50_device_maximum_minimum_ssrgemm_tt_t_32x32x8_32x16x1_4x4_8x4_ using WarpShape = cutlass::gemm::GemmShape<32, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -629,9 +629,9 @@ static void BM_SM50_device_maximum_minimum_ssrgemm_tt_t_32x64x8_32x32x1_8x4_4x8_ using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = 
Config::MultiplicationOp; @@ -679,9 +679,9 @@ static void BM_SM50_device_maximum_minimum_ssrgemm_tt_t_32x128x8_32x64x1_8x8_4x8 using WarpShape = cutlass::gemm::GemmShape<32, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -729,9 +729,9 @@ static void BM_SM50_device_maximum_minimum_ssrgemm_tt_t_64x64x8_64x32x1_8x8_8x4_ using WarpShape = cutlass::gemm::GemmShape<64, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -779,9 +779,9 @@ static void BM_SM50_device_maximum_minimum_ssrgemm_tt_t_32x32x8_16x32x1_4x4_4x8_ using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -829,9 +829,9 @@ static void 
BM_SM50_device_maximum_minimum_ssrgemm_tt_t_64x32x8_32x32x1_8x4_4x8_ using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -879,9 +879,9 @@ static void BM_SM50_device_maximum_minimum_ssrgemm_tt_t_64x64x8_32x64x1_8x8_4x8_ using WarpShape = cutlass::gemm::GemmShape<32, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -929,9 +929,9 @@ static void BM_SM50_device_maximum_minimum_ssrgemm_tt_t_128x32x8_64x32x1_8x8_8x4 using WarpShape = cutlass::gemm::GemmShape<64, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -979,9 +979,9 @@ static void 
BM_SM50_device_maximum_minimum_ssrgemm_tt_t_16x32x8_8x16x1_2x2_4x8_2 using WarpShape = cutlass::gemm::GemmShape<8, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1029,9 +1029,9 @@ static void BM_SM50_device_maximum_minimum_ssrgemm_tt_t_16x64x8_8x32x1_2x4_4x8_2 using WarpShape = cutlass::gemm::GemmShape<8, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1079,9 +1079,9 @@ static void BM_SM50_device_maximum_minimum_ssrgemm_tt_t_32x32x8_16x16x1_4x2_4x8_ using WarpShape = cutlass::gemm::GemmShape<16, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1129,9 +1129,9 @@ static void 
BM_SM50_device_maximum_minimum_ssrgemm_tt_t_32x64x8_16x32x1_4x4_4x8_ using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1179,9 +1179,9 @@ static void BM_SM50_device_maximum_minimum_ssrgemm_tt_t_32x128x8_16x64x1_4x8_4x8 using WarpShape = cutlass::gemm::GemmShape<16, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1229,9 +1229,9 @@ static void BM_SM50_device_maximum_minimum_ssrgemm_tt_t_64x32x8_32x16x1_4x4_8x4_ using WarpShape = cutlass::gemm::GemmShape<32, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1279,9 +1279,9 @@ static void 
BM_SM50_device_maximum_minimum_ssrgemm_tt_t_64x64x8_32x32x1_8x4_4x8_ using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1329,9 +1329,9 @@ static void BM_SM50_device_maximum_minimum_ssrgemm_tt_t_64x128x8_32x64x1_8x8_4x8 using WarpShape = cutlass::gemm::GemmShape<32, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1379,9 +1379,9 @@ static void BM_SM50_device_maximum_minimum_ssrgemm_tt_t_128x32x8_64x16x1_8x4_8x4 using WarpShape = cutlass::gemm::GemmShape<64, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1429,9 +1429,9 @@ static void 
BM_SM50_device_maximum_minimum_ssrgemm_tt_t_128x64x8_64x32x1_8x8_8x4 using WarpShape = cutlass::gemm::GemmShape<64, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1479,9 +1479,9 @@ static void BM_SM50_device_maximum_minimum_ssrgemm_tt_t_16x64x16_8x16x1_2x2_4x8_ using WarpShape = cutlass::gemm::GemmShape<8, 16, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1529,9 +1529,9 @@ static void BM_SM50_device_maximum_minimum_ssrgemm_tt_t_16x128x16_8x32x1_2x4_4x8 using WarpShape = cutlass::gemm::GemmShape<8, 32, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1579,9 +1579,9 @@ static void 
BM_SM50_device_maximum_minimum_ssrgemm_tt_t_32x32x8_16x8x1_2x2_8x4_2 using WarpShape = cutlass::gemm::GemmShape<16, 8, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1629,9 +1629,9 @@ static void BM_SM50_device_maximum_minimum_ssrgemm_tt_t_32x64x8_16x16x1_4x2_4x8_ using WarpShape = cutlass::gemm::GemmShape<16, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1679,9 +1679,9 @@ static void BM_SM50_device_maximum_minimum_ssrgemm_tt_t_32x128x8_16x32x1_4x4_4x8 using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1729,9 +1729,9 @@ static void 
BM_SM50_device_maximum_minimum_ssrgemm_tt_t_32x256x8_16x64x1_4x8_4x8 using WarpShape = cutlass::gemm::GemmShape<16, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1779,9 +1779,9 @@ static void BM_SM50_device_maximum_minimum_ssrgemm_tt_t_64x64x8_32x16x1_4x4_8x4_ using WarpShape = cutlass::gemm::GemmShape<32, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1829,9 +1829,9 @@ static void BM_SM50_device_maximum_minimum_ssrgemm_tt_t_64x128x8_32x32x1_8x4_4x8 using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1879,9 +1879,9 @@ static void 
BM_SM50_device_maximum_minimum_ssrgemm_tt_t_64x256x8_32x64x1_8x8_4x8 using WarpShape = cutlass::gemm::GemmShape<32, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1929,9 +1929,9 @@ static void BM_SM50_device_maximum_minimum_ssrgemm_tt_t_128x128x8_64x32x1_8x8_8x using WarpShape = cutlass::gemm::GemmShape<64, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1979,9 +1979,9 @@ static void BM_SM50_device_maximum_minimum_ssrgemm_tt_t_32x32x8_8x16x1_2x2_4x8_4 using WarpShape = cutlass::gemm::GemmShape<8, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -2029,9 +2029,9 @@ static void 
BM_SM50_device_maximum_minimum_ssrgemm_tt_t_64x32x8_16x16x1_4x2_4x8_ using WarpShape = cutlass::gemm::GemmShape<16, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -2079,9 +2079,9 @@ static void BM_SM50_device_maximum_minimum_ssrgemm_tt_t_64x64x8_16x32x1_4x4_4x8_ using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -2129,9 +2129,9 @@ static void BM_SM50_device_maximum_minimum_ssrgemm_tt_t_128x32x8_32x16x1_4x4_8x4 using WarpShape = cutlass::gemm::GemmShape<32, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -2179,9 +2179,9 @@ static void 
BM_SM50_device_maximum_minimum_ssrgemm_tt_t_128x64x8_32x32x1_8x4_4x8 using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -2229,9 +2229,9 @@ static void BM_SM50_device_maximum_minimum_ssrgemm_tt_t_128x128x8_32x64x1_8x8_4x using WarpShape = cutlass::gemm::GemmShape<32, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -2279,9 +2279,9 @@ static void BM_SM50_device_maximum_minimum_ssrgemm_tt_t_256x32x8_64x16x1_8x4_8x4 using WarpShape = cutlass::gemm::GemmShape<64, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -2329,9 +2329,9 @@ static void 
BM_SM50_device_maximum_minimum_ssrgemm_tt_t_256x64x8_64x32x1_8x8_8x4 using WarpShape = cutlass::gemm::GemmShape<64, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -2379,9 +2379,9 @@ static void BM_SM50_device_maximum_minimum_ssrgemm_tt_t_32x64x16_8x16x1_2x2_4x8_ using WarpShape = cutlass::gemm::GemmShape<8, 16, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -2429,9 +2429,9 @@ static void BM_SM50_device_maximum_minimum_ssrgemm_tt_t_32x128x16_8x32x1_2x4_4x8 using WarpShape = cutlass::gemm::GemmShape<8, 32, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -2479,9 +2479,9 @@ static void 
BM_SM50_device_maximum_minimum_ssrgemm_tt_t_64x32x16_16x8x1_2x2_8x4_ using WarpShape = cutlass::gemm::GemmShape<16, 8, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -2529,9 +2529,9 @@ static void BM_SM50_device_maximum_minimum_ssrgemm_tt_t_64x64x8_16x16x1_4x2_4x8_ using WarpShape = cutlass::gemm::GemmShape<16, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -2579,9 +2579,9 @@ static void BM_SM50_device_maximum_minimum_ssrgemm_tt_t_64x128x8_16x32x1_4x4_4x8 using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -2629,9 +2629,9 @@ static void 
BM_SM50_device_maximum_minimum_ssrgemm_tt_t_64x256x8_16x64x1_4x8_4x8 using WarpShape = cutlass::gemm::GemmShape<16, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -2679,9 +2679,9 @@ static void BM_SM50_device_maximum_minimum_ssrgemm_tt_t_128x32x16_32x8x1_4x2_8x4 using WarpShape = cutlass::gemm::GemmShape<32, 8, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -2729,9 +2729,9 @@ static void BM_SM50_device_maximum_minimum_ssrgemm_tt_t_128x64x8_32x16x1_4x4_8x4 using WarpShape = cutlass::gemm::GemmShape<32, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -2779,9 +2779,9 @@ static void 
BM_SM50_device_maximum_minimum_ssrgemm_tt_t_128x128x8_32x32x1_8x4_4x using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -2829,9 +2829,9 @@ static void BM_SM50_device_maximum_minimum_ssrgemm_tt_t_256x64x8_64x16x1_8x4_8x4 using WarpShape = cutlass::gemm::GemmShape<64, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; diff --git a/bench/device/sm50_simt_maximum_multiplies_dsrgemm_nn_n.cu b/bench/device/sm50_simt_maximum_multiplies_dsrgemm_nn_n.cu index 9591333..da6528a 100644 --- a/bench/device/sm50_simt_maximum_multiplies_dsrgemm_nn_n.cu +++ b/bench/device/sm50_simt_maximum_multiplies_dsrgemm_nn_n.cu @@ -29,9 +29,9 @@ static void BM_SM50_device_maximum_multiplies_dsrgemm_nn_n_8x32x8_8x32x1_2x4_4x8 using WarpShape = cutlass::gemm::GemmShape<8, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename 
cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -79,9 +79,9 @@ static void BM_SM50_device_maximum_multiplies_dsrgemm_nn_n_16x32x8_16x32x1_4x4_4 using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -129,9 +129,9 @@ static void BM_SM50_device_maximum_multiplies_dsrgemm_nn_n_16x64x8_16x64x1_4x8_4 using WarpShape = cutlass::gemm::GemmShape<16, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -179,9 +179,9 @@ static void BM_SM50_device_maximum_multiplies_dsrgemm_nn_n_32x32x8_32x32x1_8x4_4 using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename 
cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -229,9 +229,9 @@ static void BM_SM50_device_maximum_multiplies_dsrgemm_nn_n_8x32x8_8x16x1_2x2_4x8 using WarpShape = cutlass::gemm::GemmShape<8, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -279,9 +279,9 @@ static void BM_SM50_device_maximum_multiplies_dsrgemm_nn_n_8x64x8_8x32x1_2x4_4x8 using WarpShape = cutlass::gemm::GemmShape<8, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -329,9 +329,9 @@ static void BM_SM50_device_maximum_multiplies_dsrgemm_nn_n_16x32x8_16x16x1_4x2_4 using WarpShape = cutlass::gemm::GemmShape<16, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename 
cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -379,9 +379,9 @@ static void BM_SM50_device_maximum_multiplies_dsrgemm_nn_n_16x64x8_16x32x1_4x4_4 using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -429,9 +429,9 @@ static void BM_SM50_device_maximum_multiplies_dsrgemm_nn_n_16x128x8_16x64x1_4x8_ using WarpShape = cutlass::gemm::GemmShape<16, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -479,9 +479,9 @@ static void BM_SM50_device_maximum_multiplies_dsrgemm_nn_n_32x32x8_32x16x1_4x4_8 using WarpShape = cutlass::gemm::GemmShape<32, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename 
cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -529,9 +529,9 @@ static void BM_SM50_device_maximum_multiplies_dsrgemm_nn_n_32x64x8_32x32x1_8x4_4 using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -579,9 +579,9 @@ static void BM_SM50_device_maximum_multiplies_dsrgemm_nn_n_32x32x8_16x32x1_4x4_4 using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -629,9 +629,9 @@ static void BM_SM50_device_maximum_multiplies_dsrgemm_nn_n_64x32x8_32x32x1_8x4_4 using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename 
cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -679,9 +679,9 @@ static void BM_SM50_device_maximum_multiplies_dsrgemm_nn_n_16x32x8_8x16x1_2x2_4x using WarpShape = cutlass::gemm::GemmShape<8, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -729,9 +729,9 @@ static void BM_SM50_device_maximum_multiplies_dsrgemm_nn_n_16x64x8_8x32x1_2x4_4x using WarpShape = cutlass::gemm::GemmShape<8, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -779,9 +779,9 @@ static void BM_SM50_device_maximum_multiplies_dsrgemm_nn_n_32x32x8_16x16x1_4x2_4 using WarpShape = cutlass::gemm::GemmShape<16, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename 
cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -829,9 +829,9 @@ static void BM_SM50_device_maximum_multiplies_dsrgemm_nn_n_32x64x8_16x32x1_4x4_4 using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -879,9 +879,9 @@ static void BM_SM50_device_maximum_multiplies_dsrgemm_nn_n_32x128x8_16x64x1_4x8_ using WarpShape = cutlass::gemm::GemmShape<16, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -929,9 +929,9 @@ static void BM_SM50_device_maximum_multiplies_dsrgemm_nn_n_64x32x8_32x16x1_4x4_8 using WarpShape = cutlass::gemm::GemmShape<32, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename 
cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -979,9 +979,9 @@ static void BM_SM50_device_maximum_multiplies_dsrgemm_nn_n_64x64x8_32x32x1_8x4_4 using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1029,9 +1029,9 @@ static void BM_SM50_device_maximum_multiplies_dsrgemm_nn_n_128x32x8_64x16x1_8x4_ using WarpShape = cutlass::gemm::GemmShape<64, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1079,9 +1079,9 @@ static void BM_SM50_device_maximum_multiplies_dsrgemm_nn_n_16x64x16_8x16x1_2x2_4 using WarpShape = cutlass::gemm::GemmShape<8, 16, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename 
cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1129,9 +1129,9 @@ static void BM_SM50_device_maximum_multiplies_dsrgemm_nn_n_16x128x16_8x32x1_2x4_ using WarpShape = cutlass::gemm::GemmShape<8, 32, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1179,9 +1179,9 @@ static void BM_SM50_device_maximum_multiplies_dsrgemm_nn_n_32x32x8_16x8x1_2x2_8x using WarpShape = cutlass::gemm::GemmShape<16, 8, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1229,9 +1229,9 @@ static void BM_SM50_device_maximum_multiplies_dsrgemm_nn_n_32x64x8_16x16x1_4x2_4 using WarpShape = cutlass::gemm::GemmShape<16, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename 
cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1279,9 +1279,9 @@ static void BM_SM50_device_maximum_multiplies_dsrgemm_nn_n_32x128x8_16x32x1_4x4_ using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1329,9 +1329,9 @@ static void BM_SM50_device_maximum_multiplies_dsrgemm_nn_n_64x64x8_32x16x1_4x4_8 using WarpShape = cutlass::gemm::GemmShape<32, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1379,9 +1379,9 @@ static void BM_SM50_device_maximum_multiplies_dsrgemm_nn_n_32x32x8_8x16x1_2x2_4x using WarpShape = cutlass::gemm::GemmShape<8, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename 
cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1429,9 +1429,9 @@ static void BM_SM50_device_maximum_multiplies_dsrgemm_nn_n_64x32x8_16x16x1_4x2_4 using WarpShape = cutlass::gemm::GemmShape<16, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1479,9 +1479,9 @@ static void BM_SM50_device_maximum_multiplies_dsrgemm_nn_n_64x64x8_16x32x1_4x4_4 using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1529,9 +1529,9 @@ static void BM_SM50_device_maximum_multiplies_dsrgemm_nn_n_128x32x8_32x16x1_4x4_ using WarpShape = cutlass::gemm::GemmShape<32, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename 
cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1579,9 +1579,9 @@ static void BM_SM50_device_maximum_multiplies_dsrgemm_nn_n_32x64x16_8x16x1_2x2_4 using WarpShape = cutlass::gemm::GemmShape<8, 16, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1629,9 +1629,9 @@ static void BM_SM50_device_maximum_multiplies_dsrgemm_nn_n_32x128x16_8x32x1_2x4_ using WarpShape = cutlass::gemm::GemmShape<8, 32, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1679,9 +1679,9 @@ static void BM_SM50_device_maximum_multiplies_dsrgemm_nn_n_64x32x16_16x8x1_2x2_8 using WarpShape = cutlass::gemm::GemmShape<16, 8, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename 
cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1729,9 +1729,9 @@ static void BM_SM50_device_maximum_multiplies_dsrgemm_nn_n_64x64x8_16x16x1_4x2_4 using WarpShape = cutlass::gemm::GemmShape<16, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1779,9 +1779,9 @@ static void BM_SM50_device_maximum_multiplies_dsrgemm_nn_n_128x32x16_32x8x1_4x2_ using WarpShape = cutlass::gemm::GemmShape<32, 8, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; diff --git a/bench/device/sm50_simt_maximum_multiplies_dsrgemm_nn_t.cu b/bench/device/sm50_simt_maximum_multiplies_dsrgemm_nn_t.cu index f6cb9f2..38d926d 100644 --- a/bench/device/sm50_simt_maximum_multiplies_dsrgemm_nn_t.cu +++ b/bench/device/sm50_simt_maximum_multiplies_dsrgemm_nn_t.cu @@ -29,9 +29,9 @@ static void BM_SM50_device_maximum_multiplies_dsrgemm_nn_t_8x32x8_8x32x1_2x4_4x8 using WarpShape = cutlass::gemm::GemmShape<8, 32, 8>; using 
InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -79,9 +79,9 @@ static void BM_SM50_device_maximum_multiplies_dsrgemm_nn_t_16x32x8_16x32x1_4x4_4 using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -129,9 +129,9 @@ static void BM_SM50_device_maximum_multiplies_dsrgemm_nn_t_16x64x8_16x64x1_4x8_4 using WarpShape = cutlass::gemm::GemmShape<16, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -179,9 +179,9 @@ static void BM_SM50_device_maximum_multiplies_dsrgemm_nn_t_32x32x8_32x32x1_8x4_4 using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = 
cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -229,9 +229,9 @@ static void BM_SM50_device_maximum_multiplies_dsrgemm_nn_t_8x32x8_8x16x1_2x2_4x8 using WarpShape = cutlass::gemm::GemmShape<8, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -279,9 +279,9 @@ static void BM_SM50_device_maximum_multiplies_dsrgemm_nn_t_8x64x8_8x32x1_2x4_4x8 using WarpShape = cutlass::gemm::GemmShape<8, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -329,9 +329,9 @@ static void BM_SM50_device_maximum_multiplies_dsrgemm_nn_t_16x32x8_16x16x1_4x2_4 using WarpShape = cutlass::gemm::GemmShape<16, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using 
Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -379,9 +379,9 @@ static void BM_SM50_device_maximum_multiplies_dsrgemm_nn_t_16x64x8_16x32x1_4x4_4 using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -429,9 +429,9 @@ static void BM_SM50_device_maximum_multiplies_dsrgemm_nn_t_16x128x8_16x64x1_4x8_ using WarpShape = cutlass::gemm::GemmShape<16, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -479,9 +479,9 @@ static void BM_SM50_device_maximum_multiplies_dsrgemm_nn_t_32x32x8_32x16x1_4x4_8 using WarpShape = cutlass::gemm::GemmShape<32, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename 
cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -529,9 +529,9 @@ static void BM_SM50_device_maximum_multiplies_dsrgemm_nn_t_32x64x8_32x32x1_8x4_4 using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -579,9 +579,9 @@ static void BM_SM50_device_maximum_multiplies_dsrgemm_nn_t_32x32x8_16x32x1_4x4_4 using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -629,9 +629,9 @@ static void BM_SM50_device_maximum_multiplies_dsrgemm_nn_t_64x32x8_32x32x1_8x4_4 using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename 
cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -679,9 +679,9 @@ static void BM_SM50_device_maximum_multiplies_dsrgemm_nn_t_16x32x8_8x16x1_2x2_4x using WarpShape = cutlass::gemm::GemmShape<8, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -729,9 +729,9 @@ static void BM_SM50_device_maximum_multiplies_dsrgemm_nn_t_16x64x8_8x32x1_2x4_4x using WarpShape = cutlass::gemm::GemmShape<8, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -779,9 +779,9 @@ static void BM_SM50_device_maximum_multiplies_dsrgemm_nn_t_32x32x8_16x16x1_4x2_4 using WarpShape = cutlass::gemm::GemmShape<16, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename 
cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -829,9 +829,9 @@ static void BM_SM50_device_maximum_multiplies_dsrgemm_nn_t_32x64x8_16x32x1_4x4_4 using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -879,9 +879,9 @@ static void BM_SM50_device_maximum_multiplies_dsrgemm_nn_t_32x128x8_16x64x1_4x8_ using WarpShape = cutlass::gemm::GemmShape<16, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -929,9 +929,9 @@ static void BM_SM50_device_maximum_multiplies_dsrgemm_nn_t_64x32x8_32x16x1_4x4_8 using WarpShape = cutlass::gemm::GemmShape<32, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename 
cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -979,9 +979,9 @@ static void BM_SM50_device_maximum_multiplies_dsrgemm_nn_t_64x64x8_32x32x1_8x4_4 using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1029,9 +1029,9 @@ static void BM_SM50_device_maximum_multiplies_dsrgemm_nn_t_128x32x8_64x16x1_8x4_ using WarpShape = cutlass::gemm::GemmShape<64, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1079,9 +1079,9 @@ static void BM_SM50_device_maximum_multiplies_dsrgemm_nn_t_16x64x16_8x16x1_2x2_4 using WarpShape = cutlass::gemm::GemmShape<8, 16, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename 
cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1129,9 +1129,9 @@ static void BM_SM50_device_maximum_multiplies_dsrgemm_nn_t_16x128x16_8x32x1_2x4_ using WarpShape = cutlass::gemm::GemmShape<8, 32, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1179,9 +1179,9 @@ static void BM_SM50_device_maximum_multiplies_dsrgemm_nn_t_32x32x8_16x8x1_2x2_8x using WarpShape = cutlass::gemm::GemmShape<16, 8, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1229,9 +1229,9 @@ static void BM_SM50_device_maximum_multiplies_dsrgemm_nn_t_32x64x8_16x16x1_4x2_4 using WarpShape = cutlass::gemm::GemmShape<16, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename 
cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1279,9 +1279,9 @@ static void BM_SM50_device_maximum_multiplies_dsrgemm_nn_t_32x128x8_16x32x1_4x4_ using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1329,9 +1329,9 @@ static void BM_SM50_device_maximum_multiplies_dsrgemm_nn_t_64x64x8_32x16x1_4x4_8 using WarpShape = cutlass::gemm::GemmShape<32, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1379,9 +1379,9 @@ static void BM_SM50_device_maximum_multiplies_dsrgemm_nn_t_32x32x8_8x16x1_2x2_4x using WarpShape = cutlass::gemm::GemmShape<8, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename 
cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1429,9 +1429,9 @@ static void BM_SM50_device_maximum_multiplies_dsrgemm_nn_t_64x32x8_16x16x1_4x2_4 using WarpShape = cutlass::gemm::GemmShape<16, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1479,9 +1479,9 @@ static void BM_SM50_device_maximum_multiplies_dsrgemm_nn_t_64x64x8_16x32x1_4x4_4 using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1529,9 +1529,9 @@ static void BM_SM50_device_maximum_multiplies_dsrgemm_nn_t_128x32x8_32x16x1_4x4_ using WarpShape = cutlass::gemm::GemmShape<32, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename 
cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1579,9 +1579,9 @@ static void BM_SM50_device_maximum_multiplies_dsrgemm_nn_t_32x64x16_8x16x1_2x2_4 using WarpShape = cutlass::gemm::GemmShape<8, 16, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1629,9 +1629,9 @@ static void BM_SM50_device_maximum_multiplies_dsrgemm_nn_t_32x128x16_8x32x1_2x4_ using WarpShape = cutlass::gemm::GemmShape<8, 32, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1679,9 +1679,9 @@ static void BM_SM50_device_maximum_multiplies_dsrgemm_nn_t_64x32x16_16x8x1_2x2_8 using WarpShape = cutlass::gemm::GemmShape<16, 8, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename 
cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1729,9 +1729,9 @@ static void BM_SM50_device_maximum_multiplies_dsrgemm_nn_t_64x64x8_16x16x1_4x2_4 using WarpShape = cutlass::gemm::GemmShape<16, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1779,9 +1779,9 @@ static void BM_SM50_device_maximum_multiplies_dsrgemm_nn_t_128x32x16_32x8x1_4x2_ using WarpShape = cutlass::gemm::GemmShape<32, 8, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; diff --git a/bench/device/sm50_simt_maximum_multiplies_dsrgemm_nt_n.cu b/bench/device/sm50_simt_maximum_multiplies_dsrgemm_nt_n.cu index 7469cac..d63bd71 100644 --- a/bench/device/sm50_simt_maximum_multiplies_dsrgemm_nt_n.cu +++ 
b/bench/device/sm50_simt_maximum_multiplies_dsrgemm_nt_n.cu @@ -29,9 +29,9 @@ static void BM_SM50_device_maximum_multiplies_dsrgemm_nt_n_8x32x8_8x32x1_2x4_4x8 using WarpShape = cutlass::gemm::GemmShape<8, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -79,9 +79,9 @@ static void BM_SM50_device_maximum_multiplies_dsrgemm_nt_n_16x32x8_16x32x1_4x4_4 using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -129,9 +129,9 @@ static void BM_SM50_device_maximum_multiplies_dsrgemm_nt_n_16x64x8_16x64x1_4x8_4 using WarpShape = cutlass::gemm::GemmShape<16, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = 
Config::MultiplicationOp; @@ -179,9 +179,9 @@ static void BM_SM50_device_maximum_multiplies_dsrgemm_nt_n_32x32x8_32x32x1_8x4_4 using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -229,9 +229,9 @@ static void BM_SM50_device_maximum_multiplies_dsrgemm_nt_n_8x32x8_8x16x1_2x2_4x8 using WarpShape = cutlass::gemm::GemmShape<8, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -279,9 +279,9 @@ static void BM_SM50_device_maximum_multiplies_dsrgemm_nt_n_8x64x8_8x32x1_2x4_4x8 using WarpShape = cutlass::gemm::GemmShape<8, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -329,9 +329,9 
@@ static void BM_SM50_device_maximum_multiplies_dsrgemm_nt_n_16x32x8_16x16x1_4x2_4 using WarpShape = cutlass::gemm::GemmShape<16, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -379,9 +379,9 @@ static void BM_SM50_device_maximum_multiplies_dsrgemm_nt_n_16x64x8_16x32x1_4x4_4 using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -429,9 +429,9 @@ static void BM_SM50_device_maximum_multiplies_dsrgemm_nt_n_16x128x8_16x64x1_4x8_ using WarpShape = cutlass::gemm::GemmShape<16, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -479,9 +479,9 @@ static void 
BM_SM50_device_maximum_multiplies_dsrgemm_nt_n_32x32x8_32x16x1_4x4_8 using WarpShape = cutlass::gemm::GemmShape<32, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -529,9 +529,9 @@ static void BM_SM50_device_maximum_multiplies_dsrgemm_nt_n_32x64x8_32x32x1_8x4_4 using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -579,9 +579,9 @@ static void BM_SM50_device_maximum_multiplies_dsrgemm_nt_n_32x32x8_16x32x1_4x4_4 using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -629,9 +629,9 @@ static void 
BM_SM50_device_maximum_multiplies_dsrgemm_nt_n_64x32x8_32x32x1_8x4_4 using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -679,9 +679,9 @@ static void BM_SM50_device_maximum_multiplies_dsrgemm_nt_n_16x32x8_8x16x1_2x2_4x using WarpShape = cutlass::gemm::GemmShape<8, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -729,9 +729,9 @@ static void BM_SM50_device_maximum_multiplies_dsrgemm_nt_n_16x64x8_8x32x1_2x4_4x using WarpShape = cutlass::gemm::GemmShape<8, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -779,9 +779,9 @@ static void 
BM_SM50_device_maximum_multiplies_dsrgemm_nt_n_32x32x8_16x16x1_4x2_4 using WarpShape = cutlass::gemm::GemmShape<16, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -829,9 +829,9 @@ static void BM_SM50_device_maximum_multiplies_dsrgemm_nt_n_32x64x8_16x32x1_4x4_4 using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -879,9 +879,9 @@ static void BM_SM50_device_maximum_multiplies_dsrgemm_nt_n_32x128x8_16x64x1_4x8_ using WarpShape = cutlass::gemm::GemmShape<16, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -929,9 +929,9 @@ static void 
BM_SM50_device_maximum_multiplies_dsrgemm_nt_n_64x32x8_32x16x1_4x4_8 using WarpShape = cutlass::gemm::GemmShape<32, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -979,9 +979,9 @@ static void BM_SM50_device_maximum_multiplies_dsrgemm_nt_n_64x64x8_32x32x1_8x4_4 using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1029,9 +1029,9 @@ static void BM_SM50_device_maximum_multiplies_dsrgemm_nt_n_128x32x8_64x16x1_8x4_ using WarpShape = cutlass::gemm::GemmShape<64, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1079,9 +1079,9 @@ static void 
BM_SM50_device_maximum_multiplies_dsrgemm_nt_n_16x64x16_8x16x1_2x2_4 using WarpShape = cutlass::gemm::GemmShape<8, 16, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1129,9 +1129,9 @@ static void BM_SM50_device_maximum_multiplies_dsrgemm_nt_n_16x128x16_8x32x1_2x4_ using WarpShape = cutlass::gemm::GemmShape<8, 32, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1179,9 +1179,9 @@ static void BM_SM50_device_maximum_multiplies_dsrgemm_nt_n_32x32x8_16x8x1_2x2_8x using WarpShape = cutlass::gemm::GemmShape<16, 8, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1229,9 +1229,9 @@ static void 
BM_SM50_device_maximum_multiplies_dsrgemm_nt_n_32x64x8_16x16x1_4x2_4 using WarpShape = cutlass::gemm::GemmShape<16, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1279,9 +1279,9 @@ static void BM_SM50_device_maximum_multiplies_dsrgemm_nt_n_32x128x8_16x32x1_4x4_ using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1329,9 +1329,9 @@ static void BM_SM50_device_maximum_multiplies_dsrgemm_nt_n_64x64x8_32x16x1_4x4_8 using WarpShape = cutlass::gemm::GemmShape<32, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1379,9 +1379,9 @@ static void 
BM_SM50_device_maximum_multiplies_dsrgemm_nt_n_32x32x8_8x16x1_2x2_4x using WarpShape = cutlass::gemm::GemmShape<8, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1429,9 +1429,9 @@ static void BM_SM50_device_maximum_multiplies_dsrgemm_nt_n_64x32x8_16x16x1_4x2_4 using WarpShape = cutlass::gemm::GemmShape<16, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1479,9 +1479,9 @@ static void BM_SM50_device_maximum_multiplies_dsrgemm_nt_n_64x64x8_16x32x1_4x4_4 using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1529,9 +1529,9 @@ static void 
BM_SM50_device_maximum_multiplies_dsrgemm_nt_n_128x32x8_32x16x1_4x4_ using WarpShape = cutlass::gemm::GemmShape<32, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1579,9 +1579,9 @@ static void BM_SM50_device_maximum_multiplies_dsrgemm_nt_n_32x64x16_8x16x1_2x2_4 using WarpShape = cutlass::gemm::GemmShape<8, 16, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1629,9 +1629,9 @@ static void BM_SM50_device_maximum_multiplies_dsrgemm_nt_n_32x128x16_8x32x1_2x4_ using WarpShape = cutlass::gemm::GemmShape<8, 32, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1679,9 +1679,9 @@ static void 
BM_SM50_device_maximum_multiplies_dsrgemm_nt_n_64x32x16_16x8x1_2x2_8 using WarpShape = cutlass::gemm::GemmShape<16, 8, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1729,9 +1729,9 @@ static void BM_SM50_device_maximum_multiplies_dsrgemm_nt_n_64x64x8_16x16x1_4x2_4 using WarpShape = cutlass::gemm::GemmShape<16, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1779,9 +1779,9 @@ static void BM_SM50_device_maximum_multiplies_dsrgemm_nt_n_128x32x16_32x8x1_4x2_ using WarpShape = cutlass::gemm::GemmShape<32, 8, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; diff --git 
a/bench/device/sm50_simt_maximum_multiplies_dsrgemm_nt_t.cu b/bench/device/sm50_simt_maximum_multiplies_dsrgemm_nt_t.cu index 71f2a55..dcd179d 100644 --- a/bench/device/sm50_simt_maximum_multiplies_dsrgemm_nt_t.cu +++ b/bench/device/sm50_simt_maximum_multiplies_dsrgemm_nt_t.cu @@ -29,9 +29,9 @@ static void BM_SM50_device_maximum_multiplies_dsrgemm_nt_t_8x32x8_8x32x1_2x4_4x8 using WarpShape = cutlass::gemm::GemmShape<8, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -79,9 +79,9 @@ static void BM_SM50_device_maximum_multiplies_dsrgemm_nt_t_16x32x8_16x32x1_4x4_4 using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -129,9 +129,9 @@ static void BM_SM50_device_maximum_multiplies_dsrgemm_nt_t_16x64x8_16x64x1_4x8_4 using WarpShape = cutlass::gemm::GemmShape<16, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = 
typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -179,9 +179,9 @@ static void BM_SM50_device_maximum_multiplies_dsrgemm_nt_t_32x32x8_32x32x1_8x4_4 using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -229,9 +229,9 @@ static void BM_SM50_device_maximum_multiplies_dsrgemm_nt_t_8x32x8_8x16x1_2x2_4x8 using WarpShape = cutlass::gemm::GemmShape<8, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -279,9 +279,9 @@ static void BM_SM50_device_maximum_multiplies_dsrgemm_nt_t_8x64x8_8x32x1_2x4_4x8 using WarpShape = cutlass::gemm::GemmShape<8, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename 
cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -329,9 +329,9 @@ static void BM_SM50_device_maximum_multiplies_dsrgemm_nt_t_16x32x8_16x16x1_4x2_4 using WarpShape = cutlass::gemm::GemmShape<16, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -379,9 +379,9 @@ static void BM_SM50_device_maximum_multiplies_dsrgemm_nt_t_16x64x8_16x32x1_4x4_4 using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -429,9 +429,9 @@ static void BM_SM50_device_maximum_multiplies_dsrgemm_nt_t_16x128x8_16x64x1_4x8_ using WarpShape = cutlass::gemm::GemmShape<16, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename 
cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -479,9 +479,9 @@ static void BM_SM50_device_maximum_multiplies_dsrgemm_nt_t_32x32x8_32x16x1_4x4_8 using WarpShape = cutlass::gemm::GemmShape<32, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -529,9 +529,9 @@ static void BM_SM50_device_maximum_multiplies_dsrgemm_nt_t_32x64x8_32x32x1_8x4_4 using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -579,9 +579,9 @@ static void BM_SM50_device_maximum_multiplies_dsrgemm_nt_t_32x32x8_16x32x1_4x4_4 using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename 
cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -629,9 +629,9 @@ static void BM_SM50_device_maximum_multiplies_dsrgemm_nt_t_64x32x8_32x32x1_8x4_4 using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -679,9 +679,9 @@ static void BM_SM50_device_maximum_multiplies_dsrgemm_nt_t_16x32x8_8x16x1_2x2_4x using WarpShape = cutlass::gemm::GemmShape<8, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -729,9 +729,9 @@ static void BM_SM50_device_maximum_multiplies_dsrgemm_nt_t_16x64x8_8x32x1_2x4_4x using WarpShape = cutlass::gemm::GemmShape<8, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename 
cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -779,9 +779,9 @@ static void BM_SM50_device_maximum_multiplies_dsrgemm_nt_t_32x32x8_16x16x1_4x2_4 using WarpShape = cutlass::gemm::GemmShape<16, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -829,9 +829,9 @@ static void BM_SM50_device_maximum_multiplies_dsrgemm_nt_t_32x64x8_16x32x1_4x4_4 using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -879,9 +879,9 @@ static void BM_SM50_device_maximum_multiplies_dsrgemm_nt_t_32x128x8_16x64x1_4x8_ using WarpShape = cutlass::gemm::GemmShape<16, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename 
cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -929,9 +929,9 @@ static void BM_SM50_device_maximum_multiplies_dsrgemm_nt_t_64x32x8_32x16x1_4x4_8 using WarpShape = cutlass::gemm::GemmShape<32, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -979,9 +979,9 @@ static void BM_SM50_device_maximum_multiplies_dsrgemm_nt_t_64x64x8_32x32x1_8x4_4 using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1029,9 +1029,9 @@ static void BM_SM50_device_maximum_multiplies_dsrgemm_nt_t_128x32x8_64x16x1_8x4_ using WarpShape = cutlass::gemm::GemmShape<64, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename 
cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1079,9 +1079,9 @@ static void BM_SM50_device_maximum_multiplies_dsrgemm_nt_t_16x64x16_8x16x1_2x2_4 using WarpShape = cutlass::gemm::GemmShape<8, 16, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1129,9 +1129,9 @@ static void BM_SM50_device_maximum_multiplies_dsrgemm_nt_t_16x128x16_8x32x1_2x4_ using WarpShape = cutlass::gemm::GemmShape<8, 32, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1179,9 +1179,9 @@ static void BM_SM50_device_maximum_multiplies_dsrgemm_nt_t_32x32x8_16x8x1_2x2_8x using WarpShape = cutlass::gemm::GemmShape<16, 8, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename 
cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1229,9 +1229,9 @@ static void BM_SM50_device_maximum_multiplies_dsrgemm_nt_t_32x64x8_16x16x1_4x2_4 using WarpShape = cutlass::gemm::GemmShape<16, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1279,9 +1279,9 @@ static void BM_SM50_device_maximum_multiplies_dsrgemm_nt_t_32x128x8_16x32x1_4x4_ using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1329,9 +1329,9 @@ static void BM_SM50_device_maximum_multiplies_dsrgemm_nt_t_64x64x8_32x16x1_4x4_8 using WarpShape = cutlass::gemm::GemmShape<32, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename 
cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1379,9 +1379,9 @@ static void BM_SM50_device_maximum_multiplies_dsrgemm_nt_t_32x32x8_8x16x1_2x2_4x using WarpShape = cutlass::gemm::GemmShape<8, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1429,9 +1429,9 @@ static void BM_SM50_device_maximum_multiplies_dsrgemm_nt_t_64x32x8_16x16x1_4x2_4 using WarpShape = cutlass::gemm::GemmShape<16, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1479,9 +1479,9 @@ static void BM_SM50_device_maximum_multiplies_dsrgemm_nt_t_64x64x8_16x32x1_4x4_4 using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename 
cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1529,9 +1529,9 @@ static void BM_SM50_device_maximum_multiplies_dsrgemm_nt_t_128x32x8_32x16x1_4x4_ using WarpShape = cutlass::gemm::GemmShape<32, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1579,9 +1579,9 @@ static void BM_SM50_device_maximum_multiplies_dsrgemm_nt_t_32x64x16_8x16x1_2x2_4 using WarpShape = cutlass::gemm::GemmShape<8, 16, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1629,9 +1629,9 @@ static void BM_SM50_device_maximum_multiplies_dsrgemm_nt_t_32x128x16_8x32x1_2x4_ using WarpShape = cutlass::gemm::GemmShape<8, 32, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename 
cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1679,9 +1679,9 @@ static void BM_SM50_device_maximum_multiplies_dsrgemm_nt_t_64x32x16_16x8x1_2x2_8 using WarpShape = cutlass::gemm::GemmShape<16, 8, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1729,9 +1729,9 @@ static void BM_SM50_device_maximum_multiplies_dsrgemm_nt_t_64x64x8_16x16x1_4x2_4 using WarpShape = cutlass::gemm::GemmShape<16, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1779,9 +1779,9 @@ static void BM_SM50_device_maximum_multiplies_dsrgemm_nt_t_128x32x16_32x8x1_4x2_ using WarpShape = cutlass::gemm::GemmShape<32, 8, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename 
cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; diff --git a/bench/device/sm50_simt_maximum_multiplies_dsrgemm_tn_n.cu b/bench/device/sm50_simt_maximum_multiplies_dsrgemm_tn_n.cu index bedb8cb..0fde3c0 100644 --- a/bench/device/sm50_simt_maximum_multiplies_dsrgemm_tn_n.cu +++ b/bench/device/sm50_simt_maximum_multiplies_dsrgemm_tn_n.cu @@ -29,9 +29,9 @@ static void BM_SM50_device_maximum_multiplies_dsrgemm_tn_n_8x32x8_8x32x1_2x4_4x8 using WarpShape = cutlass::gemm::GemmShape<8, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -79,9 +79,9 @@ static void BM_SM50_device_maximum_multiplies_dsrgemm_tn_n_16x32x8_16x32x1_4x4_4 using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -129,9 +129,9 @@ static void BM_SM50_device_maximum_multiplies_dsrgemm_tn_n_16x64x8_16x64x1_4x8_4 using WarpShape = cutlass::gemm::GemmShape<16, 64, 8>; using InstructionShape = 
cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -179,9 +179,9 @@ static void BM_SM50_device_maximum_multiplies_dsrgemm_tn_n_32x32x8_32x32x1_8x4_4 using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -229,9 +229,9 @@ static void BM_SM50_device_maximum_multiplies_dsrgemm_tn_n_8x32x8_8x16x1_2x2_4x8 using WarpShape = cutlass::gemm::GemmShape<8, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -279,9 +279,9 @@ static void BM_SM50_device_maximum_multiplies_dsrgemm_tn_n_8x64x8_8x32x1_2x4_4x8 using WarpShape = cutlass::gemm::GemmShape<8, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using 
Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -329,9 +329,9 @@ static void BM_SM50_device_maximum_multiplies_dsrgemm_tn_n_16x32x8_16x16x1_4x2_4 using WarpShape = cutlass::gemm::GemmShape<16, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -379,9 +379,9 @@ static void BM_SM50_device_maximum_multiplies_dsrgemm_tn_n_16x64x8_16x32x1_4x4_4 using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -429,9 +429,9 @@ static void BM_SM50_device_maximum_multiplies_dsrgemm_tn_n_16x128x8_16x64x1_4x8_ using WarpShape = cutlass::gemm::GemmShape<16, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename 
cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -479,9 +479,9 @@ static void BM_SM50_device_maximum_multiplies_dsrgemm_tn_n_32x32x8_32x16x1_4x4_8 using WarpShape = cutlass::gemm::GemmShape<32, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -529,9 +529,9 @@ static void BM_SM50_device_maximum_multiplies_dsrgemm_tn_n_32x64x8_32x32x1_8x4_4 using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -579,9 +579,9 @@ static void BM_SM50_device_maximum_multiplies_dsrgemm_tn_n_32x32x8_16x32x1_4x4_4 using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename 
cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -629,9 +629,9 @@ static void BM_SM50_device_maximum_multiplies_dsrgemm_tn_n_64x32x8_32x32x1_8x4_4 using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -679,9 +679,9 @@ static void BM_SM50_device_maximum_multiplies_dsrgemm_tn_n_16x32x8_8x16x1_2x2_4x using WarpShape = cutlass::gemm::GemmShape<8, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -729,9 +729,9 @@ static void BM_SM50_device_maximum_multiplies_dsrgemm_tn_n_16x64x8_8x32x1_2x4_4x using WarpShape = cutlass::gemm::GemmShape<8, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename 
cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -779,9 +779,9 @@ static void BM_SM50_device_maximum_multiplies_dsrgemm_tn_n_32x32x8_16x16x1_4x2_4 using WarpShape = cutlass::gemm::GemmShape<16, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -829,9 +829,9 @@ static void BM_SM50_device_maximum_multiplies_dsrgemm_tn_n_32x64x8_16x32x1_4x4_4 using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -879,9 +879,9 @@ static void BM_SM50_device_maximum_multiplies_dsrgemm_tn_n_32x128x8_16x64x1_4x8_ using WarpShape = cutlass::gemm::GemmShape<16, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename 
cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -929,9 +929,9 @@ static void BM_SM50_device_maximum_multiplies_dsrgemm_tn_n_64x32x8_32x16x1_4x4_8 using WarpShape = cutlass::gemm::GemmShape<32, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -979,9 +979,9 @@ static void BM_SM50_device_maximum_multiplies_dsrgemm_tn_n_64x64x8_32x32x1_8x4_4 using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1029,9 +1029,9 @@ static void BM_SM50_device_maximum_multiplies_dsrgemm_tn_n_128x32x8_64x16x1_8x4_ using WarpShape = cutlass::gemm::GemmShape<64, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename 
cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1079,9 +1079,9 @@ static void BM_SM50_device_maximum_multiplies_dsrgemm_tn_n_16x64x16_8x16x1_2x2_4 using WarpShape = cutlass::gemm::GemmShape<8, 16, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1129,9 +1129,9 @@ static void BM_SM50_device_maximum_multiplies_dsrgemm_tn_n_16x128x16_8x32x1_2x4_ using WarpShape = cutlass::gemm::GemmShape<8, 32, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1179,9 +1179,9 @@ static void BM_SM50_device_maximum_multiplies_dsrgemm_tn_n_32x32x8_16x8x1_2x2_8x using WarpShape = cutlass::gemm::GemmShape<16, 8, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename 
cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1229,9 +1229,9 @@ static void BM_SM50_device_maximum_multiplies_dsrgemm_tn_n_32x64x8_16x16x1_4x2_4 using WarpShape = cutlass::gemm::GemmShape<16, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1279,9 +1279,9 @@ static void BM_SM50_device_maximum_multiplies_dsrgemm_tn_n_32x128x8_16x32x1_4x4_ using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1329,9 +1329,9 @@ static void BM_SM50_device_maximum_multiplies_dsrgemm_tn_n_64x64x8_32x16x1_4x4_8 using WarpShape = cutlass::gemm::GemmShape<32, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename 
cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1379,9 +1379,9 @@ static void BM_SM50_device_maximum_multiplies_dsrgemm_tn_n_32x32x8_8x16x1_2x2_4x using WarpShape = cutlass::gemm::GemmShape<8, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1429,9 +1429,9 @@ static void BM_SM50_device_maximum_multiplies_dsrgemm_tn_n_64x32x8_16x16x1_4x2_4 using WarpShape = cutlass::gemm::GemmShape<16, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1479,9 +1479,9 @@ static void BM_SM50_device_maximum_multiplies_dsrgemm_tn_n_64x64x8_16x32x1_4x4_4 using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename 
cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1529,9 +1529,9 @@ static void BM_SM50_device_maximum_multiplies_dsrgemm_tn_n_128x32x8_32x16x1_4x4_ using WarpShape = cutlass::gemm::GemmShape<32, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1579,9 +1579,9 @@ static void BM_SM50_device_maximum_multiplies_dsrgemm_tn_n_32x64x16_8x16x1_2x2_4 using WarpShape = cutlass::gemm::GemmShape<8, 16, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1629,9 +1629,9 @@ static void BM_SM50_device_maximum_multiplies_dsrgemm_tn_n_32x128x16_8x32x1_2x4_ using WarpShape = cutlass::gemm::GemmShape<8, 32, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename 
cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1679,9 +1679,9 @@ static void BM_SM50_device_maximum_multiplies_dsrgemm_tn_n_64x32x16_16x8x1_2x2_8 using WarpShape = cutlass::gemm::GemmShape<16, 8, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1729,9 +1729,9 @@ static void BM_SM50_device_maximum_multiplies_dsrgemm_tn_n_64x64x8_16x16x1_4x2_4 using WarpShape = cutlass::gemm::GemmShape<16, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1779,9 +1779,9 @@ static void BM_SM50_device_maximum_multiplies_dsrgemm_tn_n_128x32x16_32x8x1_4x2_ using WarpShape = cutlass::gemm::GemmShape<32, 8, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename 
cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; diff --git a/bench/device/sm50_simt_maximum_multiplies_dsrgemm_tn_t.cu b/bench/device/sm50_simt_maximum_multiplies_dsrgemm_tn_t.cu index 9201e57..c3d076a 100644 --- a/bench/device/sm50_simt_maximum_multiplies_dsrgemm_tn_t.cu +++ b/bench/device/sm50_simt_maximum_multiplies_dsrgemm_tn_t.cu @@ -29,9 +29,9 @@ static void BM_SM50_device_maximum_multiplies_dsrgemm_tn_t_8x32x8_8x32x1_2x4_4x8 using WarpShape = cutlass::gemm::GemmShape<8, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -79,9 +79,9 @@ static void BM_SM50_device_maximum_multiplies_dsrgemm_tn_t_16x32x8_16x32x1_4x4_4 using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = 
Config::MultiplicationOp; @@ -129,9 +129,9 @@ static void BM_SM50_device_maximum_multiplies_dsrgemm_tn_t_16x64x8_16x64x1_4x8_4 using WarpShape = cutlass::gemm::GemmShape<16, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -179,9 +179,9 @@ static void BM_SM50_device_maximum_multiplies_dsrgemm_tn_t_32x32x8_32x32x1_8x4_4 using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -229,9 +229,9 @@ static void BM_SM50_device_maximum_multiplies_dsrgemm_tn_t_8x32x8_8x16x1_2x2_4x8 using WarpShape = cutlass::gemm::GemmShape<8, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -279,9 
+279,9 @@ static void BM_SM50_device_maximum_multiplies_dsrgemm_tn_t_8x64x8_8x32x1_2x4_4x8 using WarpShape = cutlass::gemm::GemmShape<8, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -329,9 +329,9 @@ static void BM_SM50_device_maximum_multiplies_dsrgemm_tn_t_16x32x8_16x16x1_4x2_4 using WarpShape = cutlass::gemm::GemmShape<16, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -379,9 +379,9 @@ static void BM_SM50_device_maximum_multiplies_dsrgemm_tn_t_16x64x8_16x32x1_4x4_4 using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -429,9 +429,9 @@ static void 
BM_SM50_device_maximum_multiplies_dsrgemm_tn_t_16x128x8_16x64x1_4x8_ using WarpShape = cutlass::gemm::GemmShape<16, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -479,9 +479,9 @@ static void BM_SM50_device_maximum_multiplies_dsrgemm_tn_t_32x32x8_32x16x1_4x4_8 using WarpShape = cutlass::gemm::GemmShape<32, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -529,9 +529,9 @@ static void BM_SM50_device_maximum_multiplies_dsrgemm_tn_t_32x64x8_32x32x1_8x4_4 using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -579,9 +579,9 @@ static void 
BM_SM50_device_maximum_multiplies_dsrgemm_tn_t_32x32x8_16x32x1_4x4_4 using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -629,9 +629,9 @@ static void BM_SM50_device_maximum_multiplies_dsrgemm_tn_t_64x32x8_32x32x1_8x4_4 using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -679,9 +679,9 @@ static void BM_SM50_device_maximum_multiplies_dsrgemm_tn_t_16x32x8_8x16x1_2x2_4x using WarpShape = cutlass::gemm::GemmShape<8, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -729,9 +729,9 @@ static void 
BM_SM50_device_maximum_multiplies_dsrgemm_tn_t_16x64x8_8x32x1_2x4_4x using WarpShape = cutlass::gemm::GemmShape<8, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -779,9 +779,9 @@ static void BM_SM50_device_maximum_multiplies_dsrgemm_tn_t_32x32x8_16x16x1_4x2_4 using WarpShape = cutlass::gemm::GemmShape<16, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -829,9 +829,9 @@ static void BM_SM50_device_maximum_multiplies_dsrgemm_tn_t_32x64x8_16x32x1_4x4_4 using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -879,9 +879,9 @@ static void 
BM_SM50_device_maximum_multiplies_dsrgemm_tn_t_32x128x8_16x64x1_4x8_ using WarpShape = cutlass::gemm::GemmShape<16, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -929,9 +929,9 @@ static void BM_SM50_device_maximum_multiplies_dsrgemm_tn_t_64x32x8_32x16x1_4x4_8 using WarpShape = cutlass::gemm::GemmShape<32, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -979,9 +979,9 @@ static void BM_SM50_device_maximum_multiplies_dsrgemm_tn_t_64x64x8_32x32x1_8x4_4 using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1029,9 +1029,9 @@ static void 
BM_SM50_device_maximum_multiplies_dsrgemm_tn_t_128x32x8_64x16x1_8x4_ using WarpShape = cutlass::gemm::GemmShape<64, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1079,9 +1079,9 @@ static void BM_SM50_device_maximum_multiplies_dsrgemm_tn_t_16x64x16_8x16x1_2x2_4 using WarpShape = cutlass::gemm::GemmShape<8, 16, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1129,9 +1129,9 @@ static void BM_SM50_device_maximum_multiplies_dsrgemm_tn_t_16x128x16_8x32x1_2x4_ using WarpShape = cutlass::gemm::GemmShape<8, 32, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1179,9 +1179,9 @@ static void 
BM_SM50_device_maximum_multiplies_dsrgemm_tn_t_32x32x8_16x8x1_2x2_8x using WarpShape = cutlass::gemm::GemmShape<16, 8, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1229,9 +1229,9 @@ static void BM_SM50_device_maximum_multiplies_dsrgemm_tn_t_32x64x8_16x16x1_4x2_4 using WarpShape = cutlass::gemm::GemmShape<16, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1279,9 +1279,9 @@ static void BM_SM50_device_maximum_multiplies_dsrgemm_tn_t_32x128x8_16x32x1_4x4_ using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1329,9 +1329,9 @@ static void 
BM_SM50_device_maximum_multiplies_dsrgemm_tn_t_64x64x8_32x16x1_4x4_8 using WarpShape = cutlass::gemm::GemmShape<32, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1379,9 +1379,9 @@ static void BM_SM50_device_maximum_multiplies_dsrgemm_tn_t_32x32x8_8x16x1_2x2_4x using WarpShape = cutlass::gemm::GemmShape<8, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1429,9 +1429,9 @@ static void BM_SM50_device_maximum_multiplies_dsrgemm_tn_t_64x32x8_16x16x1_4x2_4 using WarpShape = cutlass::gemm::GemmShape<16, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1479,9 +1479,9 @@ static void 
BM_SM50_device_maximum_multiplies_dsrgemm_tn_t_64x64x8_16x32x1_4x4_4 using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1529,9 +1529,9 @@ static void BM_SM50_device_maximum_multiplies_dsrgemm_tn_t_128x32x8_32x16x1_4x4_ using WarpShape = cutlass::gemm::GemmShape<32, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1579,9 +1579,9 @@ static void BM_SM50_device_maximum_multiplies_dsrgemm_tn_t_32x64x16_8x16x1_2x2_4 using WarpShape = cutlass::gemm::GemmShape<8, 16, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1629,9 +1629,9 @@ static void 
BM_SM50_device_maximum_multiplies_dsrgemm_tn_t_32x128x16_8x32x1_2x4_ using WarpShape = cutlass::gemm::GemmShape<8, 32, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1679,9 +1679,9 @@ static void BM_SM50_device_maximum_multiplies_dsrgemm_tn_t_64x32x16_16x8x1_2x2_8 using WarpShape = cutlass::gemm::GemmShape<16, 8, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1729,9 +1729,9 @@ static void BM_SM50_device_maximum_multiplies_dsrgemm_tn_t_64x64x8_16x16x1_4x2_4 using WarpShape = cutlass::gemm::GemmShape<16, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1779,9 +1779,9 @@ static void 
BM_SM50_device_maximum_multiplies_dsrgemm_tn_t_128x32x16_32x8x1_4x2_ using WarpShape = cutlass::gemm::GemmShape<32, 8, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; diff --git a/bench/device/sm50_simt_maximum_multiplies_dsrgemm_tt_n.cu b/bench/device/sm50_simt_maximum_multiplies_dsrgemm_tt_n.cu index 6b247c9..b0e44bb 100644 --- a/bench/device/sm50_simt_maximum_multiplies_dsrgemm_tt_n.cu +++ b/bench/device/sm50_simt_maximum_multiplies_dsrgemm_tt_n.cu @@ -29,9 +29,9 @@ static void BM_SM50_device_maximum_multiplies_dsrgemm_tt_n_8x32x8_8x32x1_2x4_4x8 using WarpShape = cutlass::gemm::GemmShape<8, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -79,9 +79,9 @@ static void BM_SM50_device_maximum_multiplies_dsrgemm_tt_n_16x32x8_16x32x1_4x4_4 using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename 
cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -129,9 +129,9 @@ static void BM_SM50_device_maximum_multiplies_dsrgemm_tt_n_16x64x8_16x64x1_4x8_4 using WarpShape = cutlass::gemm::GemmShape<16, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -179,9 +179,9 @@ static void BM_SM50_device_maximum_multiplies_dsrgemm_tt_n_32x32x8_32x32x1_8x4_4 using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -229,9 +229,9 @@ static void BM_SM50_device_maximum_multiplies_dsrgemm_tt_n_8x32x8_8x16x1_2x2_4x8 using WarpShape = cutlass::gemm::GemmShape<8, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename 
cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -279,9 +279,9 @@ static void BM_SM50_device_maximum_multiplies_dsrgemm_tt_n_8x64x8_8x32x1_2x4_4x8 using WarpShape = cutlass::gemm::GemmShape<8, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -329,9 +329,9 @@ static void BM_SM50_device_maximum_multiplies_dsrgemm_tt_n_16x32x8_16x16x1_4x2_4 using WarpShape = cutlass::gemm::GemmShape<16, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -379,9 +379,9 @@ static void BM_SM50_device_maximum_multiplies_dsrgemm_tt_n_16x64x8_16x32x1_4x4_4 using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename 
cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -429,9 +429,9 @@ static void BM_SM50_device_maximum_multiplies_dsrgemm_tt_n_16x128x8_16x64x1_4x8_ using WarpShape = cutlass::gemm::GemmShape<16, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -479,9 +479,9 @@ static void BM_SM50_device_maximum_multiplies_dsrgemm_tt_n_32x32x8_32x16x1_4x4_8 using WarpShape = cutlass::gemm::GemmShape<32, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -529,9 +529,9 @@ static void BM_SM50_device_maximum_multiplies_dsrgemm_tt_n_32x64x8_32x32x1_8x4_4 using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename 
cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -579,9 +579,9 @@ static void BM_SM50_device_maximum_multiplies_dsrgemm_tt_n_32x32x8_16x32x1_4x4_4 using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -629,9 +629,9 @@ static void BM_SM50_device_maximum_multiplies_dsrgemm_tt_n_64x32x8_32x32x1_8x4_4 using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -679,9 +679,9 @@ static void BM_SM50_device_maximum_multiplies_dsrgemm_tt_n_16x32x8_8x16x1_2x2_4x using WarpShape = cutlass::gemm::GemmShape<8, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename 
cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -729,9 +729,9 @@ static void BM_SM50_device_maximum_multiplies_dsrgemm_tt_n_16x64x8_8x32x1_2x4_4x using WarpShape = cutlass::gemm::GemmShape<8, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -779,9 +779,9 @@ static void BM_SM50_device_maximum_multiplies_dsrgemm_tt_n_32x32x8_16x16x1_4x2_4 using WarpShape = cutlass::gemm::GemmShape<16, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -829,9 +829,9 @@ static void BM_SM50_device_maximum_multiplies_dsrgemm_tt_n_32x64x8_16x32x1_4x4_4 using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename 
cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -879,9 +879,9 @@ static void BM_SM50_device_maximum_multiplies_dsrgemm_tt_n_32x128x8_16x64x1_4x8_ using WarpShape = cutlass::gemm::GemmShape<16, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -929,9 +929,9 @@ static void BM_SM50_device_maximum_multiplies_dsrgemm_tt_n_64x32x8_32x16x1_4x4_8 using WarpShape = cutlass::gemm::GemmShape<32, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -979,9 +979,9 @@ static void BM_SM50_device_maximum_multiplies_dsrgemm_tt_n_64x64x8_32x32x1_8x4_4 using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename 
cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1029,9 +1029,9 @@ static void BM_SM50_device_maximum_multiplies_dsrgemm_tt_n_128x32x8_64x16x1_8x4_ using WarpShape = cutlass::gemm::GemmShape<64, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1079,9 +1079,9 @@ static void BM_SM50_device_maximum_multiplies_dsrgemm_tt_n_16x64x16_8x16x1_2x2_4 using WarpShape = cutlass::gemm::GemmShape<8, 16, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1129,9 +1129,9 @@ static void BM_SM50_device_maximum_multiplies_dsrgemm_tt_n_16x128x16_8x32x1_2x4_ using WarpShape = cutlass::gemm::GemmShape<8, 32, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename 
cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1179,9 +1179,9 @@ static void BM_SM50_device_maximum_multiplies_dsrgemm_tt_n_32x32x8_16x8x1_2x2_8x using WarpShape = cutlass::gemm::GemmShape<16, 8, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1229,9 +1229,9 @@ static void BM_SM50_device_maximum_multiplies_dsrgemm_tt_n_32x64x8_16x16x1_4x2_4 using WarpShape = cutlass::gemm::GemmShape<16, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1279,9 +1279,9 @@ static void BM_SM50_device_maximum_multiplies_dsrgemm_tt_n_32x128x8_16x32x1_4x4_ using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename 
cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1329,9 +1329,9 @@ static void BM_SM50_device_maximum_multiplies_dsrgemm_tt_n_64x64x8_32x16x1_4x4_8 using WarpShape = cutlass::gemm::GemmShape<32, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1379,9 +1379,9 @@ static void BM_SM50_device_maximum_multiplies_dsrgemm_tt_n_32x32x8_8x16x1_2x2_4x using WarpShape = cutlass::gemm::GemmShape<8, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1429,9 +1429,9 @@ static void BM_SM50_device_maximum_multiplies_dsrgemm_tt_n_64x32x8_16x16x1_4x2_4 using WarpShape = cutlass::gemm::GemmShape<16, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename 
cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1479,9 +1479,9 @@ static void BM_SM50_device_maximum_multiplies_dsrgemm_tt_n_64x64x8_16x32x1_4x4_4 using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1529,9 +1529,9 @@ static void BM_SM50_device_maximum_multiplies_dsrgemm_tt_n_128x32x8_32x16x1_4x4_ using WarpShape = cutlass::gemm::GemmShape<32, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1579,9 +1579,9 @@ static void BM_SM50_device_maximum_multiplies_dsrgemm_tt_n_32x64x16_8x16x1_2x2_4 using WarpShape = cutlass::gemm::GemmShape<8, 16, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename 
cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1629,9 +1629,9 @@ static void BM_SM50_device_maximum_multiplies_dsrgemm_tt_n_32x128x16_8x32x1_2x4_ using WarpShape = cutlass::gemm::GemmShape<8, 32, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1679,9 +1679,9 @@ static void BM_SM50_device_maximum_multiplies_dsrgemm_tt_n_64x32x16_16x8x1_2x2_8 using WarpShape = cutlass::gemm::GemmShape<16, 8, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1729,9 +1729,9 @@ static void BM_SM50_device_maximum_multiplies_dsrgemm_tt_n_64x64x8_16x16x1_4x2_4 using WarpShape = cutlass::gemm::GemmShape<16, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename 
cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1779,9 +1779,9 @@ static void BM_SM50_device_maximum_multiplies_dsrgemm_tt_n_128x32x16_32x8x1_4x2_ using WarpShape = cutlass::gemm::GemmShape<32, 8, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; diff --git a/bench/device/sm50_simt_maximum_multiplies_dsrgemm_tt_t.cu b/bench/device/sm50_simt_maximum_multiplies_dsrgemm_tt_t.cu index 6c62ab9..b0a5a07 100644 --- a/bench/device/sm50_simt_maximum_multiplies_dsrgemm_tt_t.cu +++ b/bench/device/sm50_simt_maximum_multiplies_dsrgemm_tt_t.cu @@ -29,9 +29,9 @@ static void BM_SM50_device_maximum_multiplies_dsrgemm_tt_t_8x32x8_8x32x1_2x4_4x8 using WarpShape = cutlass::gemm::GemmShape<8, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -79,9 +79,9 @@ static void BM_SM50_device_maximum_multiplies_dsrgemm_tt_t_16x32x8_16x32x1_4x4_4 using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = 
cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -129,9 +129,9 @@ static void BM_SM50_device_maximum_multiplies_dsrgemm_tt_t_16x64x8_16x64x1_4x8_4 using WarpShape = cutlass::gemm::GemmShape<16, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -179,9 +179,9 @@ static void BM_SM50_device_maximum_multiplies_dsrgemm_tt_t_32x32x8_32x32x1_8x4_4 using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -229,9 +229,9 @@ static void BM_SM50_device_maximum_multiplies_dsrgemm_tt_t_8x32x8_8x16x1_2x2_4x8 using WarpShape = cutlass::gemm::GemmShape<8, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - 
using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -279,9 +279,9 @@ static void BM_SM50_device_maximum_multiplies_dsrgemm_tt_t_8x64x8_8x32x1_2x4_4x8 using WarpShape = cutlass::gemm::GemmShape<8, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -329,9 +329,9 @@ static void BM_SM50_device_maximum_multiplies_dsrgemm_tt_t_16x32x8_16x16x1_4x2_4 using WarpShape = cutlass::gemm::GemmShape<16, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -379,9 +379,9 @@ static void BM_SM50_device_maximum_multiplies_dsrgemm_tt_t_16x64x8_16x32x1_4x4_4 using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename 
cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -429,9 +429,9 @@ static void BM_SM50_device_maximum_multiplies_dsrgemm_tt_t_16x128x8_16x64x1_4x8_ using WarpShape = cutlass::gemm::GemmShape<16, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -479,9 +479,9 @@ static void BM_SM50_device_maximum_multiplies_dsrgemm_tt_t_32x32x8_32x16x1_4x4_8 using WarpShape = cutlass::gemm::GemmShape<32, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -529,9 +529,9 @@ static void BM_SM50_device_maximum_multiplies_dsrgemm_tt_t_32x64x8_32x32x1_8x4_4 using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename 
cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -579,9 +579,9 @@ static void BM_SM50_device_maximum_multiplies_dsrgemm_tt_t_32x32x8_16x32x1_4x4_4 using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -629,9 +629,9 @@ static void BM_SM50_device_maximum_multiplies_dsrgemm_tt_t_64x32x8_32x32x1_8x4_4 using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -679,9 +679,9 @@ static void BM_SM50_device_maximum_multiplies_dsrgemm_tt_t_16x32x8_8x16x1_2x2_4x using WarpShape = cutlass::gemm::GemmShape<8, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename 
cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -729,9 +729,9 @@ static void BM_SM50_device_maximum_multiplies_dsrgemm_tt_t_16x64x8_8x32x1_2x4_4x using WarpShape = cutlass::gemm::GemmShape<8, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -779,9 +779,9 @@ static void BM_SM50_device_maximum_multiplies_dsrgemm_tt_t_32x32x8_16x16x1_4x2_4 using WarpShape = cutlass::gemm::GemmShape<16, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -829,9 +829,9 @@ static void BM_SM50_device_maximum_multiplies_dsrgemm_tt_t_32x64x8_16x32x1_4x4_4 using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename 
cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -879,9 +879,9 @@ static void BM_SM50_device_maximum_multiplies_dsrgemm_tt_t_32x128x8_16x64x1_4x8_ using WarpShape = cutlass::gemm::GemmShape<16, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -929,9 +929,9 @@ static void BM_SM50_device_maximum_multiplies_dsrgemm_tt_t_64x32x8_32x16x1_4x4_8 using WarpShape = cutlass::gemm::GemmShape<32, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -979,9 +979,9 @@ static void BM_SM50_device_maximum_multiplies_dsrgemm_tt_t_64x64x8_32x32x1_8x4_4 using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename 
cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1029,9 +1029,9 @@ static void BM_SM50_device_maximum_multiplies_dsrgemm_tt_t_128x32x8_64x16x1_8x4_ using WarpShape = cutlass::gemm::GemmShape<64, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1079,9 +1079,9 @@ static void BM_SM50_device_maximum_multiplies_dsrgemm_tt_t_16x64x16_8x16x1_2x2_4 using WarpShape = cutlass::gemm::GemmShape<8, 16, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1129,9 +1129,9 @@ static void BM_SM50_device_maximum_multiplies_dsrgemm_tt_t_16x128x16_8x32x1_2x4_ using WarpShape = cutlass::gemm::GemmShape<8, 32, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename 
cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1179,9 +1179,9 @@ static void BM_SM50_device_maximum_multiplies_dsrgemm_tt_t_32x32x8_16x8x1_2x2_8x using WarpShape = cutlass::gemm::GemmShape<16, 8, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1229,9 +1229,9 @@ static void BM_SM50_device_maximum_multiplies_dsrgemm_tt_t_32x64x8_16x16x1_4x2_4 using WarpShape = cutlass::gemm::GemmShape<16, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1279,9 +1279,9 @@ static void BM_SM50_device_maximum_multiplies_dsrgemm_tt_t_32x128x8_16x32x1_4x4_ using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename 
cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1329,9 +1329,9 @@ static void BM_SM50_device_maximum_multiplies_dsrgemm_tt_t_64x64x8_32x16x1_4x4_8 using WarpShape = cutlass::gemm::GemmShape<32, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1379,9 +1379,9 @@ static void BM_SM50_device_maximum_multiplies_dsrgemm_tt_t_32x32x8_8x16x1_2x2_4x using WarpShape = cutlass::gemm::GemmShape<8, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1429,9 +1429,9 @@ static void BM_SM50_device_maximum_multiplies_dsrgemm_tt_t_64x32x8_16x16x1_4x2_4 using WarpShape = cutlass::gemm::GemmShape<16, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename 
cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1479,9 +1479,9 @@ static void BM_SM50_device_maximum_multiplies_dsrgemm_tt_t_64x64x8_16x32x1_4x4_4 using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1529,9 +1529,9 @@ static void BM_SM50_device_maximum_multiplies_dsrgemm_tt_t_128x32x8_32x16x1_4x4_ using WarpShape = cutlass::gemm::GemmShape<32, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1579,9 +1579,9 @@ static void BM_SM50_device_maximum_multiplies_dsrgemm_tt_t_32x64x16_8x16x1_2x2_4 using WarpShape = cutlass::gemm::GemmShape<8, 16, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename 
cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1629,9 +1629,9 @@ static void BM_SM50_device_maximum_multiplies_dsrgemm_tt_t_32x128x16_8x32x1_2x4_ using WarpShape = cutlass::gemm::GemmShape<8, 32, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1679,9 +1679,9 @@ static void BM_SM50_device_maximum_multiplies_dsrgemm_tt_t_64x32x16_16x8x1_2x2_8 using WarpShape = cutlass::gemm::GemmShape<16, 8, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1729,9 +1729,9 @@ static void BM_SM50_device_maximum_multiplies_dsrgemm_tt_t_64x64x8_16x16x1_4x2_4 using WarpShape = cutlass::gemm::GemmShape<16, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename 
cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1779,9 +1779,9 @@ static void BM_SM50_device_maximum_multiplies_dsrgemm_tt_t_128x32x16_32x8x1_4x2_ using WarpShape = cutlass::gemm::GemmShape<32, 8, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; diff --git a/bench/device/sm50_simt_maximum_multiplies_ssrgemm_nn_n.cu b/bench/device/sm50_simt_maximum_multiplies_ssrgemm_nn_n.cu index 678313c..7d073d2 100644 --- a/bench/device/sm50_simt_maximum_multiplies_ssrgemm_nn_n.cu +++ b/bench/device/sm50_simt_maximum_multiplies_ssrgemm_nn_n.cu @@ -29,9 +29,9 @@ static void BM_SM50_device_maximum_multiplies_ssrgemm_nn_n_8x32x8_8x32x1_2x4_4x8 using WarpShape = cutlass::gemm::GemmShape<8, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = 
Config::MultiplicationOp; @@ -79,9 +79,9 @@ static void BM_SM50_device_maximum_multiplies_ssrgemm_nn_n_16x32x8_16x32x1_4x4_4 using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -129,9 +129,9 @@ static void BM_SM50_device_maximum_multiplies_ssrgemm_nn_n_16x64x8_16x64x1_4x8_4 using WarpShape = cutlass::gemm::GemmShape<16, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -179,9 +179,9 @@ static void BM_SM50_device_maximum_multiplies_ssrgemm_nn_n_32x32x8_32x32x1_8x4_4 using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -229,9 +229,9 
@@ static void BM_SM50_device_maximum_multiplies_ssrgemm_nn_n_32x64x8_32x64x1_8x8_4 using WarpShape = cutlass::gemm::GemmShape<32, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -279,9 +279,9 @@ static void BM_SM50_device_maximum_multiplies_ssrgemm_nn_n_64x32x8_64x32x1_8x8_8 using WarpShape = cutlass::gemm::GemmShape<64, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -329,9 +329,9 @@ static void BM_SM50_device_maximum_multiplies_ssrgemm_nn_n_8x32x8_8x16x1_2x2_4x8 using WarpShape = cutlass::gemm::GemmShape<8, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -379,9 +379,9 @@ static void 
BM_SM50_device_maximum_multiplies_ssrgemm_nn_n_8x64x8_8x32x1_2x4_4x8 using WarpShape = cutlass::gemm::GemmShape<8, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -429,9 +429,9 @@ static void BM_SM50_device_maximum_multiplies_ssrgemm_nn_n_16x32x8_16x16x1_4x2_4 using WarpShape = cutlass::gemm::GemmShape<16, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -479,9 +479,9 @@ static void BM_SM50_device_maximum_multiplies_ssrgemm_nn_n_16x64x8_16x32x1_4x4_4 using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -529,9 +529,9 @@ static void 
BM_SM50_device_maximum_multiplies_ssrgemm_nn_n_16x128x8_16x64x1_4x8_ using WarpShape = cutlass::gemm::GemmShape<16, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -579,9 +579,9 @@ static void BM_SM50_device_maximum_multiplies_ssrgemm_nn_n_32x32x8_32x16x1_4x4_8 using WarpShape = cutlass::gemm::GemmShape<32, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -629,9 +629,9 @@ static void BM_SM50_device_maximum_multiplies_ssrgemm_nn_n_32x64x8_32x32x1_8x4_4 using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -679,9 +679,9 @@ static void 
BM_SM50_device_maximum_multiplies_ssrgemm_nn_n_32x128x8_32x64x1_8x8_ using WarpShape = cutlass::gemm::GemmShape<32, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -729,9 +729,9 @@ static void BM_SM50_device_maximum_multiplies_ssrgemm_nn_n_64x64x8_64x32x1_8x8_8 using WarpShape = cutlass::gemm::GemmShape<64, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -779,9 +779,9 @@ static void BM_SM50_device_maximum_multiplies_ssrgemm_nn_n_32x32x8_16x32x1_4x4_4 using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -829,9 +829,9 @@ static void 
BM_SM50_device_maximum_multiplies_ssrgemm_nn_n_64x32x8_32x32x1_8x4_4 using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -879,9 +879,9 @@ static void BM_SM50_device_maximum_multiplies_ssrgemm_nn_n_64x64x8_32x64x1_8x8_4 using WarpShape = cutlass::gemm::GemmShape<32, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -929,9 +929,9 @@ static void BM_SM50_device_maximum_multiplies_ssrgemm_nn_n_128x32x8_64x32x1_8x8_ using WarpShape = cutlass::gemm::GemmShape<64, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -979,9 +979,9 @@ static void 
BM_SM50_device_maximum_multiplies_ssrgemm_nn_n_16x32x8_8x16x1_2x2_4x using WarpShape = cutlass::gemm::GemmShape<8, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1029,9 +1029,9 @@ static void BM_SM50_device_maximum_multiplies_ssrgemm_nn_n_16x64x8_8x32x1_2x4_4x using WarpShape = cutlass::gemm::GemmShape<8, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1079,9 +1079,9 @@ static void BM_SM50_device_maximum_multiplies_ssrgemm_nn_n_32x32x8_16x16x1_4x2_4 using WarpShape = cutlass::gemm::GemmShape<16, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1129,9 +1129,9 @@ static void 
BM_SM50_device_maximum_multiplies_ssrgemm_nn_n_32x64x8_16x32x1_4x4_4 using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1179,9 +1179,9 @@ static void BM_SM50_device_maximum_multiplies_ssrgemm_nn_n_32x128x8_16x64x1_4x8_ using WarpShape = cutlass::gemm::GemmShape<16, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1229,9 +1229,9 @@ static void BM_SM50_device_maximum_multiplies_ssrgemm_nn_n_64x32x8_32x16x1_4x4_8 using WarpShape = cutlass::gemm::GemmShape<32, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1279,9 +1279,9 @@ static void 
BM_SM50_device_maximum_multiplies_ssrgemm_nn_n_64x64x8_32x32x1_8x4_4 using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1329,9 +1329,9 @@ static void BM_SM50_device_maximum_multiplies_ssrgemm_nn_n_64x128x8_32x64x1_8x8_ using WarpShape = cutlass::gemm::GemmShape<32, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1379,9 +1379,9 @@ static void BM_SM50_device_maximum_multiplies_ssrgemm_nn_n_128x32x8_64x16x1_8x4_ using WarpShape = cutlass::gemm::GemmShape<64, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1429,9 +1429,9 @@ static void 
BM_SM50_device_maximum_multiplies_ssrgemm_nn_n_128x64x8_64x32x1_8x8_ using WarpShape = cutlass::gemm::GemmShape<64, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1479,9 +1479,9 @@ static void BM_SM50_device_maximum_multiplies_ssrgemm_nn_n_16x64x16_8x16x1_2x2_4 using WarpShape = cutlass::gemm::GemmShape<8, 16, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1529,9 +1529,9 @@ static void BM_SM50_device_maximum_multiplies_ssrgemm_nn_n_16x128x16_8x32x1_2x4_ using WarpShape = cutlass::gemm::GemmShape<8, 32, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1579,9 +1579,9 @@ static void 
BM_SM50_device_maximum_multiplies_ssrgemm_nn_n_32x32x8_16x8x1_2x2_8x using WarpShape = cutlass::gemm::GemmShape<16, 8, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1629,9 +1629,9 @@ static void BM_SM50_device_maximum_multiplies_ssrgemm_nn_n_32x64x8_16x16x1_4x2_4 using WarpShape = cutlass::gemm::GemmShape<16, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1679,9 +1679,9 @@ static void BM_SM50_device_maximum_multiplies_ssrgemm_nn_n_32x128x8_16x32x1_4x4_ using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1729,9 +1729,9 @@ static void 
BM_SM50_device_maximum_multiplies_ssrgemm_nn_n_32x256x8_16x64x1_4x8_ using WarpShape = cutlass::gemm::GemmShape<16, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1779,9 +1779,9 @@ static void BM_SM50_device_maximum_multiplies_ssrgemm_nn_n_64x64x8_32x16x1_4x4_8 using WarpShape = cutlass::gemm::GemmShape<32, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1829,9 +1829,9 @@ static void BM_SM50_device_maximum_multiplies_ssrgemm_nn_n_64x128x8_32x32x1_8x4_ using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1879,9 +1879,9 @@ static void 
BM_SM50_device_maximum_multiplies_ssrgemm_nn_n_64x256x8_32x64x1_8x8_ using WarpShape = cutlass::gemm::GemmShape<32, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1929,9 +1929,9 @@ static void BM_SM50_device_maximum_multiplies_ssrgemm_nn_n_128x128x8_64x32x1_8x8 using WarpShape = cutlass::gemm::GemmShape<64, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1979,9 +1979,9 @@ static void BM_SM50_device_maximum_multiplies_ssrgemm_nn_n_32x32x8_8x16x1_2x2_4x using WarpShape = cutlass::gemm::GemmShape<8, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -2029,9 +2029,9 @@ static void 
BM_SM50_device_maximum_multiplies_ssrgemm_nn_n_64x32x8_16x16x1_4x2_4 using WarpShape = cutlass::gemm::GemmShape<16, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -2079,9 +2079,9 @@ static void BM_SM50_device_maximum_multiplies_ssrgemm_nn_n_64x64x8_16x32x1_4x4_4 using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -2129,9 +2129,9 @@ static void BM_SM50_device_maximum_multiplies_ssrgemm_nn_n_128x32x8_32x16x1_4x4_ using WarpShape = cutlass::gemm::GemmShape<32, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -2179,9 +2179,9 @@ static void 
BM_SM50_device_maximum_multiplies_ssrgemm_nn_n_128x64x8_32x32x1_8x4_ using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -2229,9 +2229,9 @@ static void BM_SM50_device_maximum_multiplies_ssrgemm_nn_n_128x128x8_32x64x1_8x8 using WarpShape = cutlass::gemm::GemmShape<32, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -2279,9 +2279,9 @@ static void BM_SM50_device_maximum_multiplies_ssrgemm_nn_n_256x32x8_64x16x1_8x4_ using WarpShape = cutlass::gemm::GemmShape<64, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -2329,9 +2329,9 @@ static void 
BM_SM50_device_maximum_multiplies_ssrgemm_nn_n_256x64x8_64x32x1_8x8_ using WarpShape = cutlass::gemm::GemmShape<64, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -2379,9 +2379,9 @@ static void BM_SM50_device_maximum_multiplies_ssrgemm_nn_n_32x64x16_8x16x1_2x2_4 using WarpShape = cutlass::gemm::GemmShape<8, 16, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -2429,9 +2429,9 @@ static void BM_SM50_device_maximum_multiplies_ssrgemm_nn_n_32x128x16_8x32x1_2x4_ using WarpShape = cutlass::gemm::GemmShape<8, 32, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -2479,9 +2479,9 @@ static void 
BM_SM50_device_maximum_multiplies_ssrgemm_nn_n_64x32x16_16x8x1_2x2_8 using WarpShape = cutlass::gemm::GemmShape<16, 8, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -2529,9 +2529,9 @@ static void BM_SM50_device_maximum_multiplies_ssrgemm_nn_n_64x64x8_16x16x1_4x2_4 using WarpShape = cutlass::gemm::GemmShape<16, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -2579,9 +2579,9 @@ static void BM_SM50_device_maximum_multiplies_ssrgemm_nn_n_64x128x8_16x32x1_4x4_ using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -2629,9 +2629,9 @@ static void 
BM_SM50_device_maximum_multiplies_ssrgemm_nn_n_64x256x8_16x64x1_4x8_ using WarpShape = cutlass::gemm::GemmShape<16, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -2679,9 +2679,9 @@ static void BM_SM50_device_maximum_multiplies_ssrgemm_nn_n_128x32x16_32x8x1_4x2_ using WarpShape = cutlass::gemm::GemmShape<32, 8, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -2729,9 +2729,9 @@ static void BM_SM50_device_maximum_multiplies_ssrgemm_nn_n_128x64x8_32x16x1_4x4_ using WarpShape = cutlass::gemm::GemmShape<32, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -2779,9 +2779,9 @@ static void 
BM_SM50_device_maximum_multiplies_ssrgemm_nn_n_128x128x8_32x32x1_8x4 using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -2829,9 +2829,9 @@ static void BM_SM50_device_maximum_multiplies_ssrgemm_nn_n_256x64x8_64x16x1_8x4_ using WarpShape = cutlass::gemm::GemmShape<64, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; diff --git a/bench/device/sm50_simt_maximum_multiplies_ssrgemm_nn_t.cu b/bench/device/sm50_simt_maximum_multiplies_ssrgemm_nn_t.cu index 0730ca4..a42843a 100644 --- a/bench/device/sm50_simt_maximum_multiplies_ssrgemm_nn_t.cu +++ b/bench/device/sm50_simt_maximum_multiplies_ssrgemm_nn_t.cu @@ -29,9 +29,9 @@ static void BM_SM50_device_maximum_multiplies_ssrgemm_nn_t_8x32x8_8x32x1_2x4_4x8 using WarpShape = cutlass::gemm::GemmShape<8, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename 
cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -79,9 +79,9 @@ static void BM_SM50_device_maximum_multiplies_ssrgemm_nn_t_16x32x8_16x32x1_4x4_4 using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -129,9 +129,9 @@ static void BM_SM50_device_maximum_multiplies_ssrgemm_nn_t_16x64x8_16x64x1_4x8_4 using WarpShape = cutlass::gemm::GemmShape<16, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -179,9 +179,9 @@ static void BM_SM50_device_maximum_multiplies_ssrgemm_nn_t_32x32x8_32x32x1_8x4_4 using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename 
cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -229,9 +229,9 @@ static void BM_SM50_device_maximum_multiplies_ssrgemm_nn_t_32x64x8_32x64x1_8x8_4 using WarpShape = cutlass::gemm::GemmShape<32, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -279,9 +279,9 @@ static void BM_SM50_device_maximum_multiplies_ssrgemm_nn_t_64x32x8_64x32x1_8x8_8 using WarpShape = cutlass::gemm::GemmShape<64, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -329,9 +329,9 @@ static void BM_SM50_device_maximum_multiplies_ssrgemm_nn_t_8x32x8_8x16x1_2x2_4x8 using WarpShape = cutlass::gemm::GemmShape<8, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename 
cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -379,9 +379,9 @@ static void BM_SM50_device_maximum_multiplies_ssrgemm_nn_t_8x64x8_8x32x1_2x4_4x8 using WarpShape = cutlass::gemm::GemmShape<8, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -429,9 +429,9 @@ static void BM_SM50_device_maximum_multiplies_ssrgemm_nn_t_16x32x8_16x16x1_4x2_4 using WarpShape = cutlass::gemm::GemmShape<16, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -479,9 +479,9 @@ static void BM_SM50_device_maximum_multiplies_ssrgemm_nn_t_16x64x8_16x32x1_4x4_4 using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename 
cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -529,9 +529,9 @@ static void BM_SM50_device_maximum_multiplies_ssrgemm_nn_t_16x128x8_16x64x1_4x8_ using WarpShape = cutlass::gemm::GemmShape<16, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -579,9 +579,9 @@ static void BM_SM50_device_maximum_multiplies_ssrgemm_nn_t_32x32x8_32x16x1_4x4_8 using WarpShape = cutlass::gemm::GemmShape<32, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -629,9 +629,9 @@ static void BM_SM50_device_maximum_multiplies_ssrgemm_nn_t_32x64x8_32x32x1_8x4_4 using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename 
cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -679,9 +679,9 @@ static void BM_SM50_device_maximum_multiplies_ssrgemm_nn_t_32x128x8_32x64x1_8x8_ using WarpShape = cutlass::gemm::GemmShape<32, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -729,9 +729,9 @@ static void BM_SM50_device_maximum_multiplies_ssrgemm_nn_t_64x64x8_64x32x1_8x8_8 using WarpShape = cutlass::gemm::GemmShape<64, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -779,9 +779,9 @@ static void BM_SM50_device_maximum_multiplies_ssrgemm_nn_t_32x32x8_16x32x1_4x4_4 using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename 
cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -829,9 +829,9 @@ static void BM_SM50_device_maximum_multiplies_ssrgemm_nn_t_64x32x8_32x32x1_8x4_4 using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -879,9 +879,9 @@ static void BM_SM50_device_maximum_multiplies_ssrgemm_nn_t_64x64x8_32x64x1_8x8_4 using WarpShape = cutlass::gemm::GemmShape<32, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -929,9 +929,9 @@ static void BM_SM50_device_maximum_multiplies_ssrgemm_nn_t_128x32x8_64x32x1_8x8_ using WarpShape = cutlass::gemm::GemmShape<64, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename 
cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -979,9 +979,9 @@ static void BM_SM50_device_maximum_multiplies_ssrgemm_nn_t_16x32x8_8x16x1_2x2_4x using WarpShape = cutlass::gemm::GemmShape<8, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1029,9 +1029,9 @@ static void BM_SM50_device_maximum_multiplies_ssrgemm_nn_t_16x64x8_8x32x1_2x4_4x using WarpShape = cutlass::gemm::GemmShape<8, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1079,9 +1079,9 @@ static void BM_SM50_device_maximum_multiplies_ssrgemm_nn_t_32x32x8_16x16x1_4x2_4 using WarpShape = cutlass::gemm::GemmShape<16, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename 
cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1129,9 +1129,9 @@ static void BM_SM50_device_maximum_multiplies_ssrgemm_nn_t_32x64x8_16x32x1_4x4_4 using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1179,9 +1179,9 @@ static void BM_SM50_device_maximum_multiplies_ssrgemm_nn_t_32x128x8_16x64x1_4x8_ using WarpShape = cutlass::gemm::GemmShape<16, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1229,9 +1229,9 @@ static void BM_SM50_device_maximum_multiplies_ssrgemm_nn_t_64x32x8_32x16x1_4x4_8 using WarpShape = cutlass::gemm::GemmShape<32, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename 
cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1279,9 +1279,9 @@ static void BM_SM50_device_maximum_multiplies_ssrgemm_nn_t_64x64x8_32x32x1_8x4_4 using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1329,9 +1329,9 @@ static void BM_SM50_device_maximum_multiplies_ssrgemm_nn_t_64x128x8_32x64x1_8x8_ using WarpShape = cutlass::gemm::GemmShape<32, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1379,9 +1379,9 @@ static void BM_SM50_device_maximum_multiplies_ssrgemm_nn_t_128x32x8_64x16x1_8x4_ using WarpShape = cutlass::gemm::GemmShape<64, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename 
cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1429,9 +1429,9 @@ static void BM_SM50_device_maximum_multiplies_ssrgemm_nn_t_128x64x8_64x32x1_8x8_ using WarpShape = cutlass::gemm::GemmShape<64, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1479,9 +1479,9 @@ static void BM_SM50_device_maximum_multiplies_ssrgemm_nn_t_16x64x16_8x16x1_2x2_4 using WarpShape = cutlass::gemm::GemmShape<8, 16, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1529,9 +1529,9 @@ static void BM_SM50_device_maximum_multiplies_ssrgemm_nn_t_16x128x16_8x32x1_2x4_ using WarpShape = cutlass::gemm::GemmShape<8, 32, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename 
cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1579,9 +1579,9 @@ static void BM_SM50_device_maximum_multiplies_ssrgemm_nn_t_32x32x8_16x8x1_2x2_8x using WarpShape = cutlass::gemm::GemmShape<16, 8, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1629,9 +1629,9 @@ static void BM_SM50_device_maximum_multiplies_ssrgemm_nn_t_32x64x8_16x16x1_4x2_4 using WarpShape = cutlass::gemm::GemmShape<16, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1679,9 +1679,9 @@ static void BM_SM50_device_maximum_multiplies_ssrgemm_nn_t_32x128x8_16x32x1_4x4_ using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename 
cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1729,9 +1729,9 @@ static void BM_SM50_device_maximum_multiplies_ssrgemm_nn_t_32x256x8_16x64x1_4x8_ using WarpShape = cutlass::gemm::GemmShape<16, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1779,9 +1779,9 @@ static void BM_SM50_device_maximum_multiplies_ssrgemm_nn_t_64x64x8_32x16x1_4x4_8 using WarpShape = cutlass::gemm::GemmShape<32, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1829,9 +1829,9 @@ static void BM_SM50_device_maximum_multiplies_ssrgemm_nn_t_64x128x8_32x32x1_8x4_ using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename 
cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1879,9 +1879,9 @@ static void BM_SM50_device_maximum_multiplies_ssrgemm_nn_t_64x256x8_32x64x1_8x8_ using WarpShape = cutlass::gemm::GemmShape<32, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1929,9 +1929,9 @@ static void BM_SM50_device_maximum_multiplies_ssrgemm_nn_t_128x128x8_64x32x1_8x8 using WarpShape = cutlass::gemm::GemmShape<64, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1979,9 +1979,9 @@ static void BM_SM50_device_maximum_multiplies_ssrgemm_nn_t_32x32x8_8x16x1_2x2_4x using WarpShape = cutlass::gemm::GemmShape<8, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename 
cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -2029,9 +2029,9 @@ static void BM_SM50_device_maximum_multiplies_ssrgemm_nn_t_64x32x8_16x16x1_4x2_4 using WarpShape = cutlass::gemm::GemmShape<16, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -2079,9 +2079,9 @@ static void BM_SM50_device_maximum_multiplies_ssrgemm_nn_t_64x64x8_16x32x1_4x4_4 using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -2129,9 +2129,9 @@ static void BM_SM50_device_maximum_multiplies_ssrgemm_nn_t_128x32x8_32x16x1_4x4_ using WarpShape = cutlass::gemm::GemmShape<32, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename 
cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -2179,9 +2179,9 @@ static void BM_SM50_device_maximum_multiplies_ssrgemm_nn_t_128x64x8_32x32x1_8x4_ using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -2229,9 +2229,9 @@ static void BM_SM50_device_maximum_multiplies_ssrgemm_nn_t_128x128x8_32x64x1_8x8 using WarpShape = cutlass::gemm::GemmShape<32, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -2279,9 +2279,9 @@ static void BM_SM50_device_maximum_multiplies_ssrgemm_nn_t_256x32x8_64x16x1_8x4_ using WarpShape = cutlass::gemm::GemmShape<64, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename 
cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -2329,9 +2329,9 @@ static void BM_SM50_device_maximum_multiplies_ssrgemm_nn_t_256x64x8_64x32x1_8x8_ using WarpShape = cutlass::gemm::GemmShape<64, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -2379,9 +2379,9 @@ static void BM_SM50_device_maximum_multiplies_ssrgemm_nn_t_32x64x16_8x16x1_2x2_4 using WarpShape = cutlass::gemm::GemmShape<8, 16, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -2429,9 +2429,9 @@ static void BM_SM50_device_maximum_multiplies_ssrgemm_nn_t_32x128x16_8x32x1_2x4_ using WarpShape = cutlass::gemm::GemmShape<8, 32, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename 
cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -2479,9 +2479,9 @@ static void BM_SM50_device_maximum_multiplies_ssrgemm_nn_t_64x32x16_16x8x1_2x2_8 using WarpShape = cutlass::gemm::GemmShape<16, 8, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -2529,9 +2529,9 @@ static void BM_SM50_device_maximum_multiplies_ssrgemm_nn_t_64x64x8_16x16x1_4x2_4 using WarpShape = cutlass::gemm::GemmShape<16, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -2579,9 +2579,9 @@ static void BM_SM50_device_maximum_multiplies_ssrgemm_nn_t_64x128x8_16x32x1_4x4_ using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename 
cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -2629,9 +2629,9 @@ static void BM_SM50_device_maximum_multiplies_ssrgemm_nn_t_64x256x8_16x64x1_4x8_ using WarpShape = cutlass::gemm::GemmShape<16, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -2679,9 +2679,9 @@ static void BM_SM50_device_maximum_multiplies_ssrgemm_nn_t_128x32x16_32x8x1_4x2_ using WarpShape = cutlass::gemm::GemmShape<32, 8, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -2729,9 +2729,9 @@ static void BM_SM50_device_maximum_multiplies_ssrgemm_nn_t_128x64x8_32x16x1_4x4_ using WarpShape = cutlass::gemm::GemmShape<32, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename 
cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -2779,9 +2779,9 @@ static void BM_SM50_device_maximum_multiplies_ssrgemm_nn_t_128x128x8_32x32x1_8x4 using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -2829,9 +2829,9 @@ static void BM_SM50_device_maximum_multiplies_ssrgemm_nn_t_256x64x8_64x16x1_8x4_ using WarpShape = cutlass::gemm::GemmShape<64, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; diff --git a/bench/device/sm50_simt_maximum_multiplies_ssrgemm_nt_n.cu b/bench/device/sm50_simt_maximum_multiplies_ssrgemm_nt_n.cu index 205990d..852e99d 100644 --- a/bench/device/sm50_simt_maximum_multiplies_ssrgemm_nt_n.cu +++ b/bench/device/sm50_simt_maximum_multiplies_ssrgemm_nt_n.cu @@ -29,9 +29,9 @@ static void BM_SM50_device_maximum_multiplies_ssrgemm_nt_n_8x32x8_8x32x1_2x4_4x8 using WarpShape = cutlass::gemm::GemmShape<8, 32, 8>; using 
InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -79,9 +79,9 @@ static void BM_SM50_device_maximum_multiplies_ssrgemm_nt_n_16x32x8_16x32x1_4x4_4 using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -129,9 +129,9 @@ static void BM_SM50_device_maximum_multiplies_ssrgemm_nt_n_16x64x8_16x64x1_4x8_4 using WarpShape = cutlass::gemm::GemmShape<16, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -179,9 +179,9 @@ static void BM_SM50_device_maximum_multiplies_ssrgemm_nt_n_32x32x8_32x32x1_8x4_4 using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = 
cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -229,9 +229,9 @@ static void BM_SM50_device_maximum_multiplies_ssrgemm_nt_n_32x64x8_32x64x1_8x8_4 using WarpShape = cutlass::gemm::GemmShape<32, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -279,9 +279,9 @@ static void BM_SM50_device_maximum_multiplies_ssrgemm_nt_n_64x32x8_64x32x1_8x8_8 using WarpShape = cutlass::gemm::GemmShape<64, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -329,9 +329,9 @@ static void BM_SM50_device_maximum_multiplies_ssrgemm_nt_n_8x32x8_8x16x1_2x2_4x8 using WarpShape = cutlass::gemm::GemmShape<8, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - 
using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -379,9 +379,9 @@ static void BM_SM50_device_maximum_multiplies_ssrgemm_nt_n_8x64x8_8x32x1_2x4_4x8 using WarpShape = cutlass::gemm::GemmShape<8, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -429,9 +429,9 @@ static void BM_SM50_device_maximum_multiplies_ssrgemm_nt_n_16x32x8_16x16x1_4x2_4 using WarpShape = cutlass::gemm::GemmShape<16, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -479,9 +479,9 @@ static void BM_SM50_device_maximum_multiplies_ssrgemm_nt_n_16x64x8_16x32x1_4x4_4 using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename 
cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -529,9 +529,9 @@ static void BM_SM50_device_maximum_multiplies_ssrgemm_nt_n_16x128x8_16x64x1_4x8_ using WarpShape = cutlass::gemm::GemmShape<16, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -579,9 +579,9 @@ static void BM_SM50_device_maximum_multiplies_ssrgemm_nt_n_32x32x8_32x16x1_4x4_8 using WarpShape = cutlass::gemm::GemmShape<32, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -629,9 +629,9 @@ static void BM_SM50_device_maximum_multiplies_ssrgemm_nt_n_32x64x8_32x32x1_8x4_4 using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename 
cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -679,9 +679,9 @@ static void BM_SM50_device_maximum_multiplies_ssrgemm_nt_n_32x128x8_32x64x1_8x8_ using WarpShape = cutlass::gemm::GemmShape<32, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -729,9 +729,9 @@ static void BM_SM50_device_maximum_multiplies_ssrgemm_nt_n_64x64x8_64x32x1_8x8_8 using WarpShape = cutlass::gemm::GemmShape<64, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -779,9 +779,9 @@ static void BM_SM50_device_maximum_multiplies_ssrgemm_nt_n_32x32x8_16x32x1_4x4_4 using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename 
cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -829,9 +829,9 @@ static void BM_SM50_device_maximum_multiplies_ssrgemm_nt_n_64x32x8_32x32x1_8x4_4 using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -879,9 +879,9 @@ static void BM_SM50_device_maximum_multiplies_ssrgemm_nt_n_64x64x8_32x64x1_8x8_4 using WarpShape = cutlass::gemm::GemmShape<32, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -929,9 +929,9 @@ static void BM_SM50_device_maximum_multiplies_ssrgemm_nt_n_128x32x8_64x32x1_8x8_ using WarpShape = cutlass::gemm::GemmShape<64, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename 
cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -979,9 +979,9 @@ static void BM_SM50_device_maximum_multiplies_ssrgemm_nt_n_16x32x8_8x16x1_2x2_4x using WarpShape = cutlass::gemm::GemmShape<8, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1029,9 +1029,9 @@ static void BM_SM50_device_maximum_multiplies_ssrgemm_nt_n_16x64x8_8x32x1_2x4_4x using WarpShape = cutlass::gemm::GemmShape<8, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1079,9 +1079,9 @@ static void BM_SM50_device_maximum_multiplies_ssrgemm_nt_n_32x32x8_16x16x1_4x2_4 using WarpShape = cutlass::gemm::GemmShape<16, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename 
cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1129,9 +1129,9 @@ static void BM_SM50_device_maximum_multiplies_ssrgemm_nt_n_32x64x8_16x32x1_4x4_4 using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1179,9 +1179,9 @@ static void BM_SM50_device_maximum_multiplies_ssrgemm_nt_n_32x128x8_16x64x1_4x8_ using WarpShape = cutlass::gemm::GemmShape<16, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1229,9 +1229,9 @@ static void BM_SM50_device_maximum_multiplies_ssrgemm_nt_n_64x32x8_32x16x1_4x4_8 using WarpShape = cutlass::gemm::GemmShape<32, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename 
cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1279,9 +1279,9 @@ static void BM_SM50_device_maximum_multiplies_ssrgemm_nt_n_64x64x8_32x32x1_8x4_4 using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1329,9 +1329,9 @@ static void BM_SM50_device_maximum_multiplies_ssrgemm_nt_n_64x128x8_32x64x1_8x8_ using WarpShape = cutlass::gemm::GemmShape<32, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1379,9 +1379,9 @@ static void BM_SM50_device_maximum_multiplies_ssrgemm_nt_n_128x32x8_64x16x1_8x4_ using WarpShape = cutlass::gemm::GemmShape<64, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename 
cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1429,9 +1429,9 @@ static void BM_SM50_device_maximum_multiplies_ssrgemm_nt_n_128x64x8_64x32x1_8x8_ using WarpShape = cutlass::gemm::GemmShape<64, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1479,9 +1479,9 @@ static void BM_SM50_device_maximum_multiplies_ssrgemm_nt_n_16x64x16_8x16x1_2x2_4 using WarpShape = cutlass::gemm::GemmShape<8, 16, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1529,9 +1529,9 @@ static void BM_SM50_device_maximum_multiplies_ssrgemm_nt_n_16x128x16_8x32x1_2x4_ using WarpShape = cutlass::gemm::GemmShape<8, 32, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename 
cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1579,9 +1579,9 @@ static void BM_SM50_device_maximum_multiplies_ssrgemm_nt_n_32x32x8_16x8x1_2x2_8x using WarpShape = cutlass::gemm::GemmShape<16, 8, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1629,9 +1629,9 @@ static void BM_SM50_device_maximum_multiplies_ssrgemm_nt_n_32x64x8_16x16x1_4x2_4 using WarpShape = cutlass::gemm::GemmShape<16, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1679,9 +1679,9 @@ static void BM_SM50_device_maximum_multiplies_ssrgemm_nt_n_32x128x8_16x32x1_4x4_ using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename 
cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1729,9 +1729,9 @@ static void BM_SM50_device_maximum_multiplies_ssrgemm_nt_n_32x256x8_16x64x1_4x8_ using WarpShape = cutlass::gemm::GemmShape<16, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1779,9 +1779,9 @@ static void BM_SM50_device_maximum_multiplies_ssrgemm_nt_n_64x64x8_32x16x1_4x4_8 using WarpShape = cutlass::gemm::GemmShape<32, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1829,9 +1829,9 @@ static void BM_SM50_device_maximum_multiplies_ssrgemm_nt_n_64x128x8_32x32x1_8x4_ using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename 
cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1879,9 +1879,9 @@ static void BM_SM50_device_maximum_multiplies_ssrgemm_nt_n_64x256x8_32x64x1_8x8_ using WarpShape = cutlass::gemm::GemmShape<32, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1929,9 +1929,9 @@ static void BM_SM50_device_maximum_multiplies_ssrgemm_nt_n_128x128x8_64x32x1_8x8 using WarpShape = cutlass::gemm::GemmShape<64, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1979,9 +1979,9 @@ static void BM_SM50_device_maximum_multiplies_ssrgemm_nt_n_32x32x8_8x16x1_2x2_4x using WarpShape = cutlass::gemm::GemmShape<8, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename 
cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -2029,9 +2029,9 @@ static void BM_SM50_device_maximum_multiplies_ssrgemm_nt_n_64x32x8_16x16x1_4x2_4 using WarpShape = cutlass::gemm::GemmShape<16, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -2079,9 +2079,9 @@ static void BM_SM50_device_maximum_multiplies_ssrgemm_nt_n_64x64x8_16x32x1_4x4_4 using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -2129,9 +2129,9 @@ static void BM_SM50_device_maximum_multiplies_ssrgemm_nt_n_128x32x8_32x16x1_4x4_ using WarpShape = cutlass::gemm::GemmShape<32, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename 
cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -2179,9 +2179,9 @@ static void BM_SM50_device_maximum_multiplies_ssrgemm_nt_n_128x64x8_32x32x1_8x4_ using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -2229,9 +2229,9 @@ static void BM_SM50_device_maximum_multiplies_ssrgemm_nt_n_128x128x8_32x64x1_8x8 using WarpShape = cutlass::gemm::GemmShape<32, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -2279,9 +2279,9 @@ static void BM_SM50_device_maximum_multiplies_ssrgemm_nt_n_256x32x8_64x16x1_8x4_ using WarpShape = cutlass::gemm::GemmShape<64, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename 
cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -2329,9 +2329,9 @@ static void BM_SM50_device_maximum_multiplies_ssrgemm_nt_n_256x64x8_64x32x1_8x8_ using WarpShape = cutlass::gemm::GemmShape<64, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -2379,9 +2379,9 @@ static void BM_SM50_device_maximum_multiplies_ssrgemm_nt_n_32x64x16_8x16x1_2x2_4 using WarpShape = cutlass::gemm::GemmShape<8, 16, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -2429,9 +2429,9 @@ static void BM_SM50_device_maximum_multiplies_ssrgemm_nt_n_32x128x16_8x32x1_2x4_ using WarpShape = cutlass::gemm::GemmShape<8, 32, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename 
cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -2479,9 +2479,9 @@ static void BM_SM50_device_maximum_multiplies_ssrgemm_nt_n_64x32x16_16x8x1_2x2_8 using WarpShape = cutlass::gemm::GemmShape<16, 8, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -2529,9 +2529,9 @@ static void BM_SM50_device_maximum_multiplies_ssrgemm_nt_n_64x64x8_16x16x1_4x2_4 using WarpShape = cutlass::gemm::GemmShape<16, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -2579,9 +2579,9 @@ static void BM_SM50_device_maximum_multiplies_ssrgemm_nt_n_64x128x8_16x32x1_4x4_ using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename 
cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -2629,9 +2629,9 @@ static void BM_SM50_device_maximum_multiplies_ssrgemm_nt_n_64x256x8_16x64x1_4x8_ using WarpShape = cutlass::gemm::GemmShape<16, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -2679,9 +2679,9 @@ static void BM_SM50_device_maximum_multiplies_ssrgemm_nt_n_128x32x16_32x8x1_4x2_ using WarpShape = cutlass::gemm::GemmShape<32, 8, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -2729,9 +2729,9 @@ static void BM_SM50_device_maximum_multiplies_ssrgemm_nt_n_128x64x8_32x16x1_4x4_ using WarpShape = cutlass::gemm::GemmShape<32, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename 
cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -2779,9 +2779,9 @@ static void BM_SM50_device_maximum_multiplies_ssrgemm_nt_n_128x128x8_32x32x1_8x4 using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -2829,9 +2829,9 @@ static void BM_SM50_device_maximum_multiplies_ssrgemm_nt_n_256x64x8_64x16x1_8x4_ using WarpShape = cutlass::gemm::GemmShape<64, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; diff --git a/bench/device/sm50_simt_maximum_multiplies_ssrgemm_nt_t.cu b/bench/device/sm50_simt_maximum_multiplies_ssrgemm_nt_t.cu index 1965e89..8b787f5 100644 --- a/bench/device/sm50_simt_maximum_multiplies_ssrgemm_nt_t.cu +++ 
b/bench/device/sm50_simt_maximum_multiplies_ssrgemm_nt_t.cu @@ -29,9 +29,9 @@ static void BM_SM50_device_maximum_multiplies_ssrgemm_nt_t_8x32x8_8x32x1_2x4_4x8 using WarpShape = cutlass::gemm::GemmShape<8, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -79,9 +79,9 @@ static void BM_SM50_device_maximum_multiplies_ssrgemm_nt_t_16x32x8_16x32x1_4x4_4 using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -129,9 +129,9 @@ static void BM_SM50_device_maximum_multiplies_ssrgemm_nt_t_16x64x8_16x64x1_4x8_4 using WarpShape = cutlass::gemm::GemmShape<16, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = 
Config::MultiplicationOp; @@ -179,9 +179,9 @@ static void BM_SM50_device_maximum_multiplies_ssrgemm_nt_t_32x32x8_32x32x1_8x4_4 using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -229,9 +229,9 @@ static void BM_SM50_device_maximum_multiplies_ssrgemm_nt_t_32x64x8_32x64x1_8x8_4 using WarpShape = cutlass::gemm::GemmShape<32, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -279,9 +279,9 @@ static void BM_SM50_device_maximum_multiplies_ssrgemm_nt_t_64x32x8_64x32x1_8x8_8 using WarpShape = cutlass::gemm::GemmShape<64, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -329,9 
+329,9 @@ static void BM_SM50_device_maximum_multiplies_ssrgemm_nt_t_8x32x8_8x16x1_2x2_4x8 using WarpShape = cutlass::gemm::GemmShape<8, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -379,9 +379,9 @@ static void BM_SM50_device_maximum_multiplies_ssrgemm_nt_t_8x64x8_8x32x1_2x4_4x8 using WarpShape = cutlass::gemm::GemmShape<8, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -429,9 +429,9 @@ static void BM_SM50_device_maximum_multiplies_ssrgemm_nt_t_16x32x8_16x16x1_4x2_4 using WarpShape = cutlass::gemm::GemmShape<16, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -479,9 +479,9 @@ static void 
BM_SM50_device_maximum_multiplies_ssrgemm_nt_t_16x64x8_16x32x1_4x4_4 using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -529,9 +529,9 @@ static void BM_SM50_device_maximum_multiplies_ssrgemm_nt_t_16x128x8_16x64x1_4x8_ using WarpShape = cutlass::gemm::GemmShape<16, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -579,9 +579,9 @@ static void BM_SM50_device_maximum_multiplies_ssrgemm_nt_t_32x32x8_32x16x1_4x4_8 using WarpShape = cutlass::gemm::GemmShape<32, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -629,9 +629,9 @@ static void 
BM_SM50_device_maximum_multiplies_ssrgemm_nt_t_32x64x8_32x32x1_8x4_4 using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -679,9 +679,9 @@ static void BM_SM50_device_maximum_multiplies_ssrgemm_nt_t_32x128x8_32x64x1_8x8_ using WarpShape = cutlass::gemm::GemmShape<32, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -729,9 +729,9 @@ static void BM_SM50_device_maximum_multiplies_ssrgemm_nt_t_64x64x8_64x32x1_8x8_8 using WarpShape = cutlass::gemm::GemmShape<64, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -779,9 +779,9 @@ static void 
BM_SM50_device_maximum_multiplies_ssrgemm_nt_t_32x32x8_16x32x1_4x4_4 using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -829,9 +829,9 @@ static void BM_SM50_device_maximum_multiplies_ssrgemm_nt_t_64x32x8_32x32x1_8x4_4 using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -879,9 +879,9 @@ static void BM_SM50_device_maximum_multiplies_ssrgemm_nt_t_64x64x8_32x64x1_8x8_4 using WarpShape = cutlass::gemm::GemmShape<32, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -929,9 +929,9 @@ static void 
BM_SM50_device_maximum_multiplies_ssrgemm_nt_t_128x32x8_64x32x1_8x8_ using WarpShape = cutlass::gemm::GemmShape<64, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -979,9 +979,9 @@ static void BM_SM50_device_maximum_multiplies_ssrgemm_nt_t_16x32x8_8x16x1_2x2_4x using WarpShape = cutlass::gemm::GemmShape<8, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1029,9 +1029,9 @@ static void BM_SM50_device_maximum_multiplies_ssrgemm_nt_t_16x64x8_8x32x1_2x4_4x using WarpShape = cutlass::gemm::GemmShape<8, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1079,9 +1079,9 @@ static void 
BM_SM50_device_maximum_multiplies_ssrgemm_nt_t_32x32x8_16x16x1_4x2_4 using WarpShape = cutlass::gemm::GemmShape<16, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1129,9 +1129,9 @@ static void BM_SM50_device_maximum_multiplies_ssrgemm_nt_t_32x64x8_16x32x1_4x4_4 using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1179,9 +1179,9 @@ static void BM_SM50_device_maximum_multiplies_ssrgemm_nt_t_32x128x8_16x64x1_4x8_ using WarpShape = cutlass::gemm::GemmShape<16, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1229,9 +1229,9 @@ static void 
BM_SM50_device_maximum_multiplies_ssrgemm_nt_t_64x32x8_32x16x1_4x4_8 using WarpShape = cutlass::gemm::GemmShape<32, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1279,9 +1279,9 @@ static void BM_SM50_device_maximum_multiplies_ssrgemm_nt_t_64x64x8_32x32x1_8x4_4 using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1329,9 +1329,9 @@ static void BM_SM50_device_maximum_multiplies_ssrgemm_nt_t_64x128x8_32x64x1_8x8_ using WarpShape = cutlass::gemm::GemmShape<32, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1379,9 +1379,9 @@ static void 
BM_SM50_device_maximum_multiplies_ssrgemm_nt_t_128x32x8_64x16x1_8x4_ using WarpShape = cutlass::gemm::GemmShape<64, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1429,9 +1429,9 @@ static void BM_SM50_device_maximum_multiplies_ssrgemm_nt_t_128x64x8_64x32x1_8x8_ using WarpShape = cutlass::gemm::GemmShape<64, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1479,9 +1479,9 @@ static void BM_SM50_device_maximum_multiplies_ssrgemm_nt_t_16x64x16_8x16x1_2x2_4 using WarpShape = cutlass::gemm::GemmShape<8, 16, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1529,9 +1529,9 @@ static void 
BM_SM50_device_maximum_multiplies_ssrgemm_nt_t_16x128x16_8x32x1_2x4_ using WarpShape = cutlass::gemm::GemmShape<8, 32, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1579,9 +1579,9 @@ static void BM_SM50_device_maximum_multiplies_ssrgemm_nt_t_32x32x8_16x8x1_2x2_8x using WarpShape = cutlass::gemm::GemmShape<16, 8, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1629,9 +1629,9 @@ static void BM_SM50_device_maximum_multiplies_ssrgemm_nt_t_32x64x8_16x16x1_4x2_4 using WarpShape = cutlass::gemm::GemmShape<16, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1679,9 +1679,9 @@ static void 
BM_SM50_device_maximum_multiplies_ssrgemm_nt_t_32x128x8_16x32x1_4x4_ using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1729,9 +1729,9 @@ static void BM_SM50_device_maximum_multiplies_ssrgemm_nt_t_32x256x8_16x64x1_4x8_ using WarpShape = cutlass::gemm::GemmShape<16, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1779,9 +1779,9 @@ static void BM_SM50_device_maximum_multiplies_ssrgemm_nt_t_64x64x8_32x16x1_4x4_8 using WarpShape = cutlass::gemm::GemmShape<32, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1829,9 +1829,9 @@ static void 
BM_SM50_device_maximum_multiplies_ssrgemm_nt_t_64x128x8_32x32x1_8x4_ using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1879,9 +1879,9 @@ static void BM_SM50_device_maximum_multiplies_ssrgemm_nt_t_64x256x8_32x64x1_8x8_ using WarpShape = cutlass::gemm::GemmShape<32, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1929,9 +1929,9 @@ static void BM_SM50_device_maximum_multiplies_ssrgemm_nt_t_128x128x8_64x32x1_8x8 using WarpShape = cutlass::gemm::GemmShape<64, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1979,9 +1979,9 @@ static void 
BM_SM50_device_maximum_multiplies_ssrgemm_nt_t_32x32x8_8x16x1_2x2_4x using WarpShape = cutlass::gemm::GemmShape<8, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -2029,9 +2029,9 @@ static void BM_SM50_device_maximum_multiplies_ssrgemm_nt_t_64x32x8_16x16x1_4x2_4 using WarpShape = cutlass::gemm::GemmShape<16, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -2079,9 +2079,9 @@ static void BM_SM50_device_maximum_multiplies_ssrgemm_nt_t_64x64x8_16x32x1_4x4_4 using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -2129,9 +2129,9 @@ static void 
BM_SM50_device_maximum_multiplies_ssrgemm_nt_t_128x32x8_32x16x1_4x4_ using WarpShape = cutlass::gemm::GemmShape<32, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -2179,9 +2179,9 @@ static void BM_SM50_device_maximum_multiplies_ssrgemm_nt_t_128x64x8_32x32x1_8x4_ using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -2229,9 +2229,9 @@ static void BM_SM50_device_maximum_multiplies_ssrgemm_nt_t_128x128x8_32x64x1_8x8 using WarpShape = cutlass::gemm::GemmShape<32, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -2279,9 +2279,9 @@ static void 
BM_SM50_device_maximum_multiplies_ssrgemm_nt_t_256x32x8_64x16x1_8x4_ using WarpShape = cutlass::gemm::GemmShape<64, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -2329,9 +2329,9 @@ static void BM_SM50_device_maximum_multiplies_ssrgemm_nt_t_256x64x8_64x32x1_8x8_ using WarpShape = cutlass::gemm::GemmShape<64, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -2379,9 +2379,9 @@ static void BM_SM50_device_maximum_multiplies_ssrgemm_nt_t_32x64x16_8x16x1_2x2_4 using WarpShape = cutlass::gemm::GemmShape<8, 16, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -2429,9 +2429,9 @@ static void 
BM_SM50_device_maximum_multiplies_ssrgemm_nt_t_32x128x16_8x32x1_2x4_ using WarpShape = cutlass::gemm::GemmShape<8, 32, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -2479,9 +2479,9 @@ static void BM_SM50_device_maximum_multiplies_ssrgemm_nt_t_64x32x16_16x8x1_2x2_8 using WarpShape = cutlass::gemm::GemmShape<16, 8, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -2529,9 +2529,9 @@ static void BM_SM50_device_maximum_multiplies_ssrgemm_nt_t_64x64x8_16x16x1_4x2_4 using WarpShape = cutlass::gemm::GemmShape<16, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -2579,9 +2579,9 @@ static void 
BM_SM50_device_maximum_multiplies_ssrgemm_nt_t_64x128x8_16x32x1_4x4_ using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -2629,9 +2629,9 @@ static void BM_SM50_device_maximum_multiplies_ssrgemm_nt_t_64x256x8_16x64x1_4x8_ using WarpShape = cutlass::gemm::GemmShape<16, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -2679,9 +2679,9 @@ static void BM_SM50_device_maximum_multiplies_ssrgemm_nt_t_128x32x16_32x8x1_4x2_ using WarpShape = cutlass::gemm::GemmShape<32, 8, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -2729,9 +2729,9 @@ static void 
BM_SM50_device_maximum_multiplies_ssrgemm_nt_t_128x64x8_32x16x1_4x4_ using WarpShape = cutlass::gemm::GemmShape<32, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -2779,9 +2779,9 @@ static void BM_SM50_device_maximum_multiplies_ssrgemm_nt_t_128x128x8_32x32x1_8x4 using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -2829,9 +2829,9 @@ static void BM_SM50_device_maximum_multiplies_ssrgemm_nt_t_256x64x8_64x16x1_8x4_ using WarpShape = cutlass::gemm::GemmShape<64, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; diff --git 
a/bench/device/sm50_simt_maximum_multiplies_ssrgemm_tn_n.cu b/bench/device/sm50_simt_maximum_multiplies_ssrgemm_tn_n.cu index e2b3445..72643b9 100644 --- a/bench/device/sm50_simt_maximum_multiplies_ssrgemm_tn_n.cu +++ b/bench/device/sm50_simt_maximum_multiplies_ssrgemm_tn_n.cu @@ -29,9 +29,9 @@ static void BM_SM50_device_maximum_multiplies_ssrgemm_tn_n_8x32x8_8x32x1_2x4_4x8 using WarpShape = cutlass::gemm::GemmShape<8, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -79,9 +79,9 @@ static void BM_SM50_device_maximum_multiplies_ssrgemm_tn_n_16x32x8_16x32x1_4x4_4 using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -129,9 +129,9 @@ static void BM_SM50_device_maximum_multiplies_ssrgemm_tn_n_16x64x8_16x64x1_4x8_4 using WarpShape = cutlass::gemm::GemmShape<16, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = 
typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -179,9 +179,9 @@ static void BM_SM50_device_maximum_multiplies_ssrgemm_tn_n_32x32x8_32x32x1_8x4_4 using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -229,9 +229,9 @@ static void BM_SM50_device_maximum_multiplies_ssrgemm_tn_n_32x64x8_32x64x1_8x8_4 using WarpShape = cutlass::gemm::GemmShape<32, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -279,9 +279,9 @@ static void BM_SM50_device_maximum_multiplies_ssrgemm_tn_n_64x32x8_64x32x1_8x8_8 using WarpShape = cutlass::gemm::GemmShape<64, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename 
cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -329,9 +329,9 @@ static void BM_SM50_device_maximum_multiplies_ssrgemm_tn_n_8x32x8_8x16x1_2x2_4x8 using WarpShape = cutlass::gemm::GemmShape<8, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -379,9 +379,9 @@ static void BM_SM50_device_maximum_multiplies_ssrgemm_tn_n_8x64x8_8x32x1_2x4_4x8 using WarpShape = cutlass::gemm::GemmShape<8, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -429,9 +429,9 @@ static void BM_SM50_device_maximum_multiplies_ssrgemm_tn_n_16x32x8_16x16x1_4x2_4 using WarpShape = cutlass::gemm::GemmShape<16, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename 
cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -479,9 +479,9 @@ static void BM_SM50_device_maximum_multiplies_ssrgemm_tn_n_16x64x8_16x32x1_4x4_4 using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -529,9 +529,9 @@ static void BM_SM50_device_maximum_multiplies_ssrgemm_tn_n_16x128x8_16x64x1_4x8_ using WarpShape = cutlass::gemm::GemmShape<16, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -579,9 +579,9 @@ static void BM_SM50_device_maximum_multiplies_ssrgemm_tn_n_32x32x8_32x16x1_4x4_8 using WarpShape = cutlass::gemm::GemmShape<32, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename 
cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -629,9 +629,9 @@ static void BM_SM50_device_maximum_multiplies_ssrgemm_tn_n_32x64x8_32x32x1_8x4_4 using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -679,9 +679,9 @@ static void BM_SM50_device_maximum_multiplies_ssrgemm_tn_n_32x128x8_32x64x1_8x8_ using WarpShape = cutlass::gemm::GemmShape<32, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -729,9 +729,9 @@ static void BM_SM50_device_maximum_multiplies_ssrgemm_tn_n_64x64x8_64x32x1_8x8_8 using WarpShape = cutlass::gemm::GemmShape<64, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename 
cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -779,9 +779,9 @@ static void BM_SM50_device_maximum_multiplies_ssrgemm_tn_n_32x32x8_16x32x1_4x4_4 using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -829,9 +829,9 @@ static void BM_SM50_device_maximum_multiplies_ssrgemm_tn_n_64x32x8_32x32x1_8x4_4 using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -879,9 +879,9 @@ static void BM_SM50_device_maximum_multiplies_ssrgemm_tn_n_64x64x8_32x64x1_8x8_4 using WarpShape = cutlass::gemm::GemmShape<32, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename 
cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -929,9 +929,9 @@ static void BM_SM50_device_maximum_multiplies_ssrgemm_tn_n_128x32x8_64x32x1_8x8_ using WarpShape = cutlass::gemm::GemmShape<64, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -979,9 +979,9 @@ static void BM_SM50_device_maximum_multiplies_ssrgemm_tn_n_16x32x8_8x16x1_2x2_4x using WarpShape = cutlass::gemm::GemmShape<8, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1029,9 +1029,9 @@ static void BM_SM50_device_maximum_multiplies_ssrgemm_tn_n_16x64x8_8x32x1_2x4_4x using WarpShape = cutlass::gemm::GemmShape<8, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename 
cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1079,9 +1079,9 @@ static void BM_SM50_device_maximum_multiplies_ssrgemm_tn_n_32x32x8_16x16x1_4x2_4 using WarpShape = cutlass::gemm::GemmShape<16, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1129,9 +1129,9 @@ static void BM_SM50_device_maximum_multiplies_ssrgemm_tn_n_32x64x8_16x32x1_4x4_4 using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1179,9 +1179,9 @@ static void BM_SM50_device_maximum_multiplies_ssrgemm_tn_n_32x128x8_16x64x1_4x8_ using WarpShape = cutlass::gemm::GemmShape<16, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename 
cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1229,9 +1229,9 @@ static void BM_SM50_device_maximum_multiplies_ssrgemm_tn_n_64x32x8_32x16x1_4x4_8 using WarpShape = cutlass::gemm::GemmShape<32, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1279,9 +1279,9 @@ static void BM_SM50_device_maximum_multiplies_ssrgemm_tn_n_64x64x8_32x32x1_8x4_4 using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1329,9 +1329,9 @@ static void BM_SM50_device_maximum_multiplies_ssrgemm_tn_n_64x128x8_32x64x1_8x8_ using WarpShape = cutlass::gemm::GemmShape<32, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename 
cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1379,9 +1379,9 @@ static void BM_SM50_device_maximum_multiplies_ssrgemm_tn_n_128x32x8_64x16x1_8x4_ using WarpShape = cutlass::gemm::GemmShape<64, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1429,9 +1429,9 @@ static void BM_SM50_device_maximum_multiplies_ssrgemm_tn_n_128x64x8_64x32x1_8x8_ using WarpShape = cutlass::gemm::GemmShape<64, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1479,9 +1479,9 @@ static void BM_SM50_device_maximum_multiplies_ssrgemm_tn_n_16x64x16_8x16x1_2x2_4 using WarpShape = cutlass::gemm::GemmShape<8, 16, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename 
cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1529,9 +1529,9 @@ static void BM_SM50_device_maximum_multiplies_ssrgemm_tn_n_16x128x16_8x32x1_2x4_ using WarpShape = cutlass::gemm::GemmShape<8, 32, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1579,9 +1579,9 @@ static void BM_SM50_device_maximum_multiplies_ssrgemm_tn_n_32x32x8_16x8x1_2x2_8x using WarpShape = cutlass::gemm::GemmShape<16, 8, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1629,9 +1629,9 @@ static void BM_SM50_device_maximum_multiplies_ssrgemm_tn_n_32x64x8_16x16x1_4x2_4 using WarpShape = cutlass::gemm::GemmShape<16, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename 
cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1679,9 +1679,9 @@ static void BM_SM50_device_maximum_multiplies_ssrgemm_tn_n_32x128x8_16x32x1_4x4_ using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1729,9 +1729,9 @@ static void BM_SM50_device_maximum_multiplies_ssrgemm_tn_n_32x256x8_16x64x1_4x8_ using WarpShape = cutlass::gemm::GemmShape<16, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1779,9 +1779,9 @@ static void BM_SM50_device_maximum_multiplies_ssrgemm_tn_n_64x64x8_32x16x1_4x4_8 using WarpShape = cutlass::gemm::GemmShape<32, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename 
cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1829,9 +1829,9 @@ static void BM_SM50_device_maximum_multiplies_ssrgemm_tn_n_64x128x8_32x32x1_8x4_ using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1879,9 +1879,9 @@ static void BM_SM50_device_maximum_multiplies_ssrgemm_tn_n_64x256x8_32x64x1_8x8_ using WarpShape = cutlass::gemm::GemmShape<32, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1929,9 +1929,9 @@ static void BM_SM50_device_maximum_multiplies_ssrgemm_tn_n_128x128x8_64x32x1_8x8 using WarpShape = cutlass::gemm::GemmShape<64, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename 
cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1979,9 +1979,9 @@ static void BM_SM50_device_maximum_multiplies_ssrgemm_tn_n_32x32x8_8x16x1_2x2_4x using WarpShape = cutlass::gemm::GemmShape<8, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -2029,9 +2029,9 @@ static void BM_SM50_device_maximum_multiplies_ssrgemm_tn_n_64x32x8_16x16x1_4x2_4 using WarpShape = cutlass::gemm::GemmShape<16, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -2079,9 +2079,9 @@ static void BM_SM50_device_maximum_multiplies_ssrgemm_tn_n_64x64x8_16x32x1_4x4_4 using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename 
cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -2129,9 +2129,9 @@ static void BM_SM50_device_maximum_multiplies_ssrgemm_tn_n_128x32x8_32x16x1_4x4_ using WarpShape = cutlass::gemm::GemmShape<32, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -2179,9 +2179,9 @@ static void BM_SM50_device_maximum_multiplies_ssrgemm_tn_n_128x64x8_32x32x1_8x4_ using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -2229,9 +2229,9 @@ static void BM_SM50_device_maximum_multiplies_ssrgemm_tn_n_128x128x8_32x64x1_8x8 using WarpShape = cutlass::gemm::GemmShape<32, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename 
cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -2279,9 +2279,9 @@ static void BM_SM50_device_maximum_multiplies_ssrgemm_tn_n_256x32x8_64x16x1_8x4_ using WarpShape = cutlass::gemm::GemmShape<64, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -2329,9 +2329,9 @@ static void BM_SM50_device_maximum_multiplies_ssrgemm_tn_n_256x64x8_64x32x1_8x8_ using WarpShape = cutlass::gemm::GemmShape<64, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -2379,9 +2379,9 @@ static void BM_SM50_device_maximum_multiplies_ssrgemm_tn_n_32x64x16_8x16x1_2x2_4 using WarpShape = cutlass::gemm::GemmShape<8, 16, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename 
cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -2429,9 +2429,9 @@ static void BM_SM50_device_maximum_multiplies_ssrgemm_tn_n_32x128x16_8x32x1_2x4_ using WarpShape = cutlass::gemm::GemmShape<8, 32, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -2479,9 +2479,9 @@ static void BM_SM50_device_maximum_multiplies_ssrgemm_tn_n_64x32x16_16x8x1_2x2_8 using WarpShape = cutlass::gemm::GemmShape<16, 8, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -2529,9 +2529,9 @@ static void BM_SM50_device_maximum_multiplies_ssrgemm_tn_n_64x64x8_16x16x1_4x2_4 using WarpShape = cutlass::gemm::GemmShape<16, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename 
cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -2579,9 +2579,9 @@ static void BM_SM50_device_maximum_multiplies_ssrgemm_tn_n_64x128x8_16x32x1_4x4_ using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -2629,9 +2629,9 @@ static void BM_SM50_device_maximum_multiplies_ssrgemm_tn_n_64x256x8_16x64x1_4x8_ using WarpShape = cutlass::gemm::GemmShape<16, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -2679,9 +2679,9 @@ static void BM_SM50_device_maximum_multiplies_ssrgemm_tn_n_128x32x16_32x8x1_4x2_ using WarpShape = cutlass::gemm::GemmShape<32, 8, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename 
cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -2729,9 +2729,9 @@ static void BM_SM50_device_maximum_multiplies_ssrgemm_tn_n_128x64x8_32x16x1_4x4_ using WarpShape = cutlass::gemm::GemmShape<32, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -2779,9 +2779,9 @@ static void BM_SM50_device_maximum_multiplies_ssrgemm_tn_n_128x128x8_32x32x1_8x4 using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -2829,9 +2829,9 @@ static void BM_SM50_device_maximum_multiplies_ssrgemm_tn_n_256x64x8_64x16x1_8x4_ using WarpShape = cutlass::gemm::GemmShape<64, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename 
cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; diff --git a/bench/device/sm50_simt_maximum_multiplies_ssrgemm_tn_t.cu b/bench/device/sm50_simt_maximum_multiplies_ssrgemm_tn_t.cu index 05e2794..d47d9d0 100644 --- a/bench/device/sm50_simt_maximum_multiplies_ssrgemm_tn_t.cu +++ b/bench/device/sm50_simt_maximum_multiplies_ssrgemm_tn_t.cu @@ -29,9 +29,9 @@ static void BM_SM50_device_maximum_multiplies_ssrgemm_tn_t_8x32x8_8x32x1_2x4_4x8 using WarpShape = cutlass::gemm::GemmShape<8, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -79,9 +79,9 @@ static void BM_SM50_device_maximum_multiplies_ssrgemm_tn_t_16x32x8_16x32x1_4x4_4 using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -129,9 +129,9 @@ static void BM_SM50_device_maximum_multiplies_ssrgemm_tn_t_16x64x8_16x64x1_4x8_4 using WarpShape = cutlass::gemm::GemmShape<16, 64, 8>; using InstructionShape = 
cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -179,9 +179,9 @@ static void BM_SM50_device_maximum_multiplies_ssrgemm_tn_t_32x32x8_32x32x1_8x4_4 using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -229,9 +229,9 @@ static void BM_SM50_device_maximum_multiplies_ssrgemm_tn_t_32x64x8_32x64x1_8x8_4 using WarpShape = cutlass::gemm::GemmShape<32, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -279,9 +279,9 @@ static void BM_SM50_device_maximum_multiplies_ssrgemm_tn_t_64x32x8_64x32x1_8x8_8 using WarpShape = cutlass::gemm::GemmShape<64, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - 
using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -329,9 +329,9 @@ static void BM_SM50_device_maximum_multiplies_ssrgemm_tn_t_8x32x8_8x16x1_2x2_4x8 using WarpShape = cutlass::gemm::GemmShape<8, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -379,9 +379,9 @@ static void BM_SM50_device_maximum_multiplies_ssrgemm_tn_t_8x64x8_8x32x1_2x4_4x8 using WarpShape = cutlass::gemm::GemmShape<8, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -429,9 +429,9 @@ static void BM_SM50_device_maximum_multiplies_ssrgemm_tn_t_16x32x8_16x16x1_4x2_4 using WarpShape = cutlass::gemm::GemmShape<16, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename 
cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -479,9 +479,9 @@ static void BM_SM50_device_maximum_multiplies_ssrgemm_tn_t_16x64x8_16x32x1_4x4_4 using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -529,9 +529,9 @@ static void BM_SM50_device_maximum_multiplies_ssrgemm_tn_t_16x128x8_16x64x1_4x8_ using WarpShape = cutlass::gemm::GemmShape<16, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -579,9 +579,9 @@ static void BM_SM50_device_maximum_multiplies_ssrgemm_tn_t_32x32x8_32x16x1_4x4_8 using WarpShape = cutlass::gemm::GemmShape<32, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename 
cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -629,9 +629,9 @@ static void BM_SM50_device_maximum_multiplies_ssrgemm_tn_t_32x64x8_32x32x1_8x4_4 using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -679,9 +679,9 @@ static void BM_SM50_device_maximum_multiplies_ssrgemm_tn_t_32x128x8_32x64x1_8x8_ using WarpShape = cutlass::gemm::GemmShape<32, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -729,9 +729,9 @@ static void BM_SM50_device_maximum_multiplies_ssrgemm_tn_t_64x64x8_64x32x1_8x8_8 using WarpShape = cutlass::gemm::GemmShape<64, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename 
cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -779,9 +779,9 @@ static void BM_SM50_device_maximum_multiplies_ssrgemm_tn_t_32x32x8_16x32x1_4x4_4 using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -829,9 +829,9 @@ static void BM_SM50_device_maximum_multiplies_ssrgemm_tn_t_64x32x8_32x32x1_8x4_4 using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -879,9 +879,9 @@ static void BM_SM50_device_maximum_multiplies_ssrgemm_tn_t_64x64x8_32x64x1_8x8_4 using WarpShape = cutlass::gemm::GemmShape<32, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename 
cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -929,9 +929,9 @@ static void BM_SM50_device_maximum_multiplies_ssrgemm_tn_t_128x32x8_64x32x1_8x8_ using WarpShape = cutlass::gemm::GemmShape<64, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -979,9 +979,9 @@ static void BM_SM50_device_maximum_multiplies_ssrgemm_tn_t_16x32x8_8x16x1_2x2_4x using WarpShape = cutlass::gemm::GemmShape<8, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1029,9 +1029,9 @@ static void BM_SM50_device_maximum_multiplies_ssrgemm_tn_t_16x64x8_8x32x1_2x4_4x using WarpShape = cutlass::gemm::GemmShape<8, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename 
cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1079,9 +1079,9 @@ static void BM_SM50_device_maximum_multiplies_ssrgemm_tn_t_32x32x8_16x16x1_4x2_4 using WarpShape = cutlass::gemm::GemmShape<16, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1129,9 +1129,9 @@ static void BM_SM50_device_maximum_multiplies_ssrgemm_tn_t_32x64x8_16x32x1_4x4_4 using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1179,9 +1179,9 @@ static void BM_SM50_device_maximum_multiplies_ssrgemm_tn_t_32x128x8_16x64x1_4x8_ using WarpShape = cutlass::gemm::GemmShape<16, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename 
cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1229,9 +1229,9 @@ static void BM_SM50_device_maximum_multiplies_ssrgemm_tn_t_64x32x8_32x16x1_4x4_8 using WarpShape = cutlass::gemm::GemmShape<32, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1279,9 +1279,9 @@ static void BM_SM50_device_maximum_multiplies_ssrgemm_tn_t_64x64x8_32x32x1_8x4_4 using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1329,9 +1329,9 @@ static void BM_SM50_device_maximum_multiplies_ssrgemm_tn_t_64x128x8_32x64x1_8x8_ using WarpShape = cutlass::gemm::GemmShape<32, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename 
cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1379,9 +1379,9 @@ static void BM_SM50_device_maximum_multiplies_ssrgemm_tn_t_128x32x8_64x16x1_8x4_ using WarpShape = cutlass::gemm::GemmShape<64, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1429,9 +1429,9 @@ static void BM_SM50_device_maximum_multiplies_ssrgemm_tn_t_128x64x8_64x32x1_8x8_ using WarpShape = cutlass::gemm::GemmShape<64, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1479,9 +1479,9 @@ static void BM_SM50_device_maximum_multiplies_ssrgemm_tn_t_16x64x16_8x16x1_2x2_4 using WarpShape = cutlass::gemm::GemmShape<8, 16, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename 
cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1529,9 +1529,9 @@ static void BM_SM50_device_maximum_multiplies_ssrgemm_tn_t_16x128x16_8x32x1_2x4_ using WarpShape = cutlass::gemm::GemmShape<8, 32, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1579,9 +1579,9 @@ static void BM_SM50_device_maximum_multiplies_ssrgemm_tn_t_32x32x8_16x8x1_2x2_8x using WarpShape = cutlass::gemm::GemmShape<16, 8, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1629,9 +1629,9 @@ static void BM_SM50_device_maximum_multiplies_ssrgemm_tn_t_32x64x8_16x16x1_4x2_4 using WarpShape = cutlass::gemm::GemmShape<16, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename 
cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1679,9 +1679,9 @@ static void BM_SM50_device_maximum_multiplies_ssrgemm_tn_t_32x128x8_16x32x1_4x4_ using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1729,9 +1729,9 @@ static void BM_SM50_device_maximum_multiplies_ssrgemm_tn_t_32x256x8_16x64x1_4x8_ using WarpShape = cutlass::gemm::GemmShape<16, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1779,9 +1779,9 @@ static void BM_SM50_device_maximum_multiplies_ssrgemm_tn_t_64x64x8_32x16x1_4x4_8 using WarpShape = cutlass::gemm::GemmShape<32, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename 
cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1829,9 +1829,9 @@ static void BM_SM50_device_maximum_multiplies_ssrgemm_tn_t_64x128x8_32x32x1_8x4_ using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1879,9 +1879,9 @@ static void BM_SM50_device_maximum_multiplies_ssrgemm_tn_t_64x256x8_32x64x1_8x8_ using WarpShape = cutlass::gemm::GemmShape<32, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1929,9 +1929,9 @@ static void BM_SM50_device_maximum_multiplies_ssrgemm_tn_t_128x128x8_64x32x1_8x8 using WarpShape = cutlass::gemm::GemmShape<64, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename 
cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1979,9 +1979,9 @@ static void BM_SM50_device_maximum_multiplies_ssrgemm_tn_t_32x32x8_8x16x1_2x2_4x using WarpShape = cutlass::gemm::GemmShape<8, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -2029,9 +2029,9 @@ static void BM_SM50_device_maximum_multiplies_ssrgemm_tn_t_64x32x8_16x16x1_4x2_4 using WarpShape = cutlass::gemm::GemmShape<16, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -2079,9 +2079,9 @@ static void BM_SM50_device_maximum_multiplies_ssrgemm_tn_t_64x64x8_16x32x1_4x4_4 using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename 
cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -2129,9 +2129,9 @@ static void BM_SM50_device_maximum_multiplies_ssrgemm_tn_t_128x32x8_32x16x1_4x4_ using WarpShape = cutlass::gemm::GemmShape<32, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -2179,9 +2179,9 @@ static void BM_SM50_device_maximum_multiplies_ssrgemm_tn_t_128x64x8_32x32x1_8x4_ using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -2229,9 +2229,9 @@ static void BM_SM50_device_maximum_multiplies_ssrgemm_tn_t_128x128x8_32x64x1_8x8 using WarpShape = cutlass::gemm::GemmShape<32, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename 
cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -2279,9 +2279,9 @@ static void BM_SM50_device_maximum_multiplies_ssrgemm_tn_t_256x32x8_64x16x1_8x4_ using WarpShape = cutlass::gemm::GemmShape<64, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -2329,9 +2329,9 @@ static void BM_SM50_device_maximum_multiplies_ssrgemm_tn_t_256x64x8_64x32x1_8x8_ using WarpShape = cutlass::gemm::GemmShape<64, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -2379,9 +2379,9 @@ static void BM_SM50_device_maximum_multiplies_ssrgemm_tn_t_32x64x16_8x16x1_2x2_4 using WarpShape = cutlass::gemm::GemmShape<8, 16, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename 
cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -2429,9 +2429,9 @@ static void BM_SM50_device_maximum_multiplies_ssrgemm_tn_t_32x128x16_8x32x1_2x4_ using WarpShape = cutlass::gemm::GemmShape<8, 32, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -2479,9 +2479,9 @@ static void BM_SM50_device_maximum_multiplies_ssrgemm_tn_t_64x32x16_16x8x1_2x2_8 using WarpShape = cutlass::gemm::GemmShape<16, 8, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -2529,9 +2529,9 @@ static void BM_SM50_device_maximum_multiplies_ssrgemm_tn_t_64x64x8_16x16x1_4x2_4 using WarpShape = cutlass::gemm::GemmShape<16, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename 
cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -2579,9 +2579,9 @@ static void BM_SM50_device_maximum_multiplies_ssrgemm_tn_t_64x128x8_16x32x1_4x4_ using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -2629,9 +2629,9 @@ static void BM_SM50_device_maximum_multiplies_ssrgemm_tn_t_64x256x8_16x64x1_4x8_ using WarpShape = cutlass::gemm::GemmShape<16, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -2679,9 +2679,9 @@ static void BM_SM50_device_maximum_multiplies_ssrgemm_tn_t_128x32x16_32x8x1_4x2_ using WarpShape = cutlass::gemm::GemmShape<32, 8, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename 
cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -2729,9 +2729,9 @@ static void BM_SM50_device_maximum_multiplies_ssrgemm_tn_t_128x64x8_32x16x1_4x4_ using WarpShape = cutlass::gemm::GemmShape<32, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -2779,9 +2779,9 @@ static void BM_SM50_device_maximum_multiplies_ssrgemm_tn_t_128x128x8_32x32x1_8x4 using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -2829,9 +2829,9 @@ static void BM_SM50_device_maximum_multiplies_ssrgemm_tn_t_256x64x8_64x16x1_8x4_ using WarpShape = cutlass::gemm::GemmShape<64, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename 
cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; diff --git a/bench/device/sm50_simt_maximum_multiplies_ssrgemm_tt_n.cu b/bench/device/sm50_simt_maximum_multiplies_ssrgemm_tt_n.cu index af4b94a..979ed4a 100644 --- a/bench/device/sm50_simt_maximum_multiplies_ssrgemm_tt_n.cu +++ b/bench/device/sm50_simt_maximum_multiplies_ssrgemm_tt_n.cu @@ -29,9 +29,9 @@ static void BM_SM50_device_maximum_multiplies_ssrgemm_tt_n_8x32x8_8x32x1_2x4_4x8 using WarpShape = cutlass::gemm::GemmShape<8, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -79,9 +79,9 @@ static void BM_SM50_device_maximum_multiplies_ssrgemm_tt_n_16x32x8_16x32x1_4x4_4 using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = 
Config::MultiplicationOp; @@ -129,9 +129,9 @@ static void BM_SM50_device_maximum_multiplies_ssrgemm_tt_n_16x64x8_16x64x1_4x8_4 using WarpShape = cutlass::gemm::GemmShape<16, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -179,9 +179,9 @@ static void BM_SM50_device_maximum_multiplies_ssrgemm_tt_n_32x32x8_32x32x1_8x4_4 using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -229,9 +229,9 @@ static void BM_SM50_device_maximum_multiplies_ssrgemm_tt_n_32x64x8_32x64x1_8x8_4 using WarpShape = cutlass::gemm::GemmShape<32, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -279,9 
+279,9 @@ static void BM_SM50_device_maximum_multiplies_ssrgemm_tt_n_64x32x8_64x32x1_8x8_8 using WarpShape = cutlass::gemm::GemmShape<64, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -329,9 +329,9 @@ static void BM_SM50_device_maximum_multiplies_ssrgemm_tt_n_8x32x8_8x16x1_2x2_4x8 using WarpShape = cutlass::gemm::GemmShape<8, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -379,9 +379,9 @@ static void BM_SM50_device_maximum_multiplies_ssrgemm_tt_n_8x64x8_8x32x1_2x4_4x8 using WarpShape = cutlass::gemm::GemmShape<8, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -429,9 +429,9 @@ static void 
BM_SM50_device_maximum_multiplies_ssrgemm_tt_n_16x32x8_16x16x1_4x2_4 using WarpShape = cutlass::gemm::GemmShape<16, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -479,9 +479,9 @@ static void BM_SM50_device_maximum_multiplies_ssrgemm_tt_n_16x64x8_16x32x1_4x4_4 using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -529,9 +529,9 @@ static void BM_SM50_device_maximum_multiplies_ssrgemm_tt_n_16x128x8_16x64x1_4x8_ using WarpShape = cutlass::gemm::GemmShape<16, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -579,9 +579,9 @@ static void 
BM_SM50_device_maximum_multiplies_ssrgemm_tt_n_32x32x8_32x16x1_4x4_8 using WarpShape = cutlass::gemm::GemmShape<32, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -629,9 +629,9 @@ static void BM_SM50_device_maximum_multiplies_ssrgemm_tt_n_32x64x8_32x32x1_8x4_4 using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -679,9 +679,9 @@ static void BM_SM50_device_maximum_multiplies_ssrgemm_tt_n_32x128x8_32x64x1_8x8_ using WarpShape = cutlass::gemm::GemmShape<32, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -729,9 +729,9 @@ static void 
BM_SM50_device_maximum_multiplies_ssrgemm_tt_n_64x64x8_64x32x1_8x8_8 using WarpShape = cutlass::gemm::GemmShape<64, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -779,9 +779,9 @@ static void BM_SM50_device_maximum_multiplies_ssrgemm_tt_n_32x32x8_16x32x1_4x4_4 using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -829,9 +829,9 @@ static void BM_SM50_device_maximum_multiplies_ssrgemm_tt_n_64x32x8_32x32x1_8x4_4 using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -879,9 +879,9 @@ static void 
BM_SM50_device_maximum_multiplies_ssrgemm_tt_n_64x64x8_32x64x1_8x8_4 using WarpShape = cutlass::gemm::GemmShape<32, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -929,9 +929,9 @@ static void BM_SM50_device_maximum_multiplies_ssrgemm_tt_n_128x32x8_64x32x1_8x8_ using WarpShape = cutlass::gemm::GemmShape<64, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -979,9 +979,9 @@ static void BM_SM50_device_maximum_multiplies_ssrgemm_tt_n_16x32x8_8x16x1_2x2_4x using WarpShape = cutlass::gemm::GemmShape<8, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1029,9 +1029,9 @@ static void 
BM_SM50_device_maximum_multiplies_ssrgemm_tt_n_16x64x8_8x32x1_2x4_4x using WarpShape = cutlass::gemm::GemmShape<8, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1079,9 +1079,9 @@ static void BM_SM50_device_maximum_multiplies_ssrgemm_tt_n_32x32x8_16x16x1_4x2_4 using WarpShape = cutlass::gemm::GemmShape<16, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1129,9 +1129,9 @@ static void BM_SM50_device_maximum_multiplies_ssrgemm_tt_n_32x64x8_16x32x1_4x4_4 using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1179,9 +1179,9 @@ static void 
BM_SM50_device_maximum_multiplies_ssrgemm_tt_n_32x128x8_16x64x1_4x8_ using WarpShape = cutlass::gemm::GemmShape<16, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1229,9 +1229,9 @@ static void BM_SM50_device_maximum_multiplies_ssrgemm_tt_n_64x32x8_32x16x1_4x4_8 using WarpShape = cutlass::gemm::GemmShape<32, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1279,9 +1279,9 @@ static void BM_SM50_device_maximum_multiplies_ssrgemm_tt_n_64x64x8_32x32x1_8x4_4 using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1329,9 +1329,9 @@ static void 
BM_SM50_device_maximum_multiplies_ssrgemm_tt_n_64x128x8_32x64x1_8x8_ using WarpShape = cutlass::gemm::GemmShape<32, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1379,9 +1379,9 @@ static void BM_SM50_device_maximum_multiplies_ssrgemm_tt_n_128x32x8_64x16x1_8x4_ using WarpShape = cutlass::gemm::GemmShape<64, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1429,9 +1429,9 @@ static void BM_SM50_device_maximum_multiplies_ssrgemm_tt_n_128x64x8_64x32x1_8x8_ using WarpShape = cutlass::gemm::GemmShape<64, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1479,9 +1479,9 @@ static void 
BM_SM50_device_maximum_multiplies_ssrgemm_tt_n_16x64x16_8x16x1_2x2_4 using WarpShape = cutlass::gemm::GemmShape<8, 16, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1529,9 +1529,9 @@ static void BM_SM50_device_maximum_multiplies_ssrgemm_tt_n_16x128x16_8x32x1_2x4_ using WarpShape = cutlass::gemm::GemmShape<8, 32, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1579,9 +1579,9 @@ static void BM_SM50_device_maximum_multiplies_ssrgemm_tt_n_32x32x8_16x8x1_2x2_8x using WarpShape = cutlass::gemm::GemmShape<16, 8, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1629,9 +1629,9 @@ static void 
BM_SM50_device_maximum_multiplies_ssrgemm_tt_n_32x64x8_16x16x1_4x2_4 using WarpShape = cutlass::gemm::GemmShape<16, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1679,9 +1679,9 @@ static void BM_SM50_device_maximum_multiplies_ssrgemm_tt_n_32x128x8_16x32x1_4x4_ using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1729,9 +1729,9 @@ static void BM_SM50_device_maximum_multiplies_ssrgemm_tt_n_32x256x8_16x64x1_4x8_ using WarpShape = cutlass::gemm::GemmShape<16, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1779,9 +1779,9 @@ static void 
BM_SM50_device_maximum_multiplies_ssrgemm_tt_n_64x64x8_32x16x1_4x4_8 using WarpShape = cutlass::gemm::GemmShape<32, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1829,9 +1829,9 @@ static void BM_SM50_device_maximum_multiplies_ssrgemm_tt_n_64x128x8_32x32x1_8x4_ using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1879,9 +1879,9 @@ static void BM_SM50_device_maximum_multiplies_ssrgemm_tt_n_64x256x8_32x64x1_8x8_ using WarpShape = cutlass::gemm::GemmShape<32, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1929,9 +1929,9 @@ static void 
BM_SM50_device_maximum_multiplies_ssrgemm_tt_n_128x128x8_64x32x1_8x8 using WarpShape = cutlass::gemm::GemmShape<64, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1979,9 +1979,9 @@ static void BM_SM50_device_maximum_multiplies_ssrgemm_tt_n_32x32x8_8x16x1_2x2_4x using WarpShape = cutlass::gemm::GemmShape<8, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -2029,9 +2029,9 @@ static void BM_SM50_device_maximum_multiplies_ssrgemm_tt_n_64x32x8_16x16x1_4x2_4 using WarpShape = cutlass::gemm::GemmShape<16, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -2079,9 +2079,9 @@ static void 
BM_SM50_device_maximum_multiplies_ssrgemm_tt_n_64x64x8_16x32x1_4x4_4 using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -2129,9 +2129,9 @@ static void BM_SM50_device_maximum_multiplies_ssrgemm_tt_n_128x32x8_32x16x1_4x4_ using WarpShape = cutlass::gemm::GemmShape<32, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -2179,9 +2179,9 @@ static void BM_SM50_device_maximum_multiplies_ssrgemm_tt_n_128x64x8_32x32x1_8x4_ using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -2229,9 +2229,9 @@ static void 
BM_SM50_device_maximum_multiplies_ssrgemm_tt_n_128x128x8_32x64x1_8x8 using WarpShape = cutlass::gemm::GemmShape<32, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -2279,9 +2279,9 @@ static void BM_SM50_device_maximum_multiplies_ssrgemm_tt_n_256x32x8_64x16x1_8x4_ using WarpShape = cutlass::gemm::GemmShape<64, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -2329,9 +2329,9 @@ static void BM_SM50_device_maximum_multiplies_ssrgemm_tt_n_256x64x8_64x32x1_8x8_ using WarpShape = cutlass::gemm::GemmShape<64, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -2379,9 +2379,9 @@ static void 
BM_SM50_device_maximum_multiplies_ssrgemm_tt_n_32x64x16_8x16x1_2x2_4 using WarpShape = cutlass::gemm::GemmShape<8, 16, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -2429,9 +2429,9 @@ static void BM_SM50_device_maximum_multiplies_ssrgemm_tt_n_32x128x16_8x32x1_2x4_ using WarpShape = cutlass::gemm::GemmShape<8, 32, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -2479,9 +2479,9 @@ static void BM_SM50_device_maximum_multiplies_ssrgemm_tt_n_64x32x16_16x8x1_2x2_8 using WarpShape = cutlass::gemm::GemmShape<16, 8, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -2529,9 +2529,9 @@ static void 
BM_SM50_device_maximum_multiplies_ssrgemm_tt_n_64x64x8_16x16x1_4x2_4 using WarpShape = cutlass::gemm::GemmShape<16, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -2579,9 +2579,9 @@ static void BM_SM50_device_maximum_multiplies_ssrgemm_tt_n_64x128x8_16x32x1_4x4_ using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -2629,9 +2629,9 @@ static void BM_SM50_device_maximum_multiplies_ssrgemm_tt_n_64x256x8_16x64x1_4x8_ using WarpShape = cutlass::gemm::GemmShape<16, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -2679,9 +2679,9 @@ static void 
BM_SM50_device_maximum_multiplies_ssrgemm_tt_n_128x32x16_32x8x1_4x2_ using WarpShape = cutlass::gemm::GemmShape<32, 8, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -2729,9 +2729,9 @@ static void BM_SM50_device_maximum_multiplies_ssrgemm_tt_n_128x64x8_32x16x1_4x4_ using WarpShape = cutlass::gemm::GemmShape<32, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -2779,9 +2779,9 @@ static void BM_SM50_device_maximum_multiplies_ssrgemm_tt_n_128x128x8_32x32x1_8x4 using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -2829,9 +2829,9 @@ static void 
BM_SM50_device_maximum_multiplies_ssrgemm_tt_n_256x64x8_64x16x1_8x4_ using WarpShape = cutlass::gemm::GemmShape<64, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; diff --git a/bench/device/sm50_simt_maximum_multiplies_ssrgemm_tt_t.cu b/bench/device/sm50_simt_maximum_multiplies_ssrgemm_tt_t.cu index e014bac..a962894 100644 --- a/bench/device/sm50_simt_maximum_multiplies_ssrgemm_tt_t.cu +++ b/bench/device/sm50_simt_maximum_multiplies_ssrgemm_tt_t.cu @@ -29,9 +29,9 @@ static void BM_SM50_device_maximum_multiplies_ssrgemm_tt_t_8x32x8_8x32x1_2x4_4x8 using WarpShape = cutlass::gemm::GemmShape<8, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -79,9 +79,9 @@ static void BM_SM50_device_maximum_multiplies_ssrgemm_tt_t_16x32x8_16x32x1_4x4_4 using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename 
cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -129,9 +129,9 @@ static void BM_SM50_device_maximum_multiplies_ssrgemm_tt_t_16x64x8_16x64x1_4x8_4 using WarpShape = cutlass::gemm::GemmShape<16, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -179,9 +179,9 @@ static void BM_SM50_device_maximum_multiplies_ssrgemm_tt_t_32x32x8_32x32x1_8x4_4 using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -229,9 +229,9 @@ static void BM_SM50_device_maximum_multiplies_ssrgemm_tt_t_32x64x8_32x64x1_8x8_4 using WarpShape = cutlass::gemm::GemmShape<32, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename 
cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -279,9 +279,9 @@ static void BM_SM50_device_maximum_multiplies_ssrgemm_tt_t_64x32x8_64x32x1_8x8_8 using WarpShape = cutlass::gemm::GemmShape<64, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -329,9 +329,9 @@ static void BM_SM50_device_maximum_multiplies_ssrgemm_tt_t_8x32x8_8x16x1_2x2_4x8 using WarpShape = cutlass::gemm::GemmShape<8, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -379,9 +379,9 @@ static void BM_SM50_device_maximum_multiplies_ssrgemm_tt_t_8x64x8_8x32x1_2x4_4x8 using WarpShape = cutlass::gemm::GemmShape<8, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename 
cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -429,9 +429,9 @@ static void BM_SM50_device_maximum_multiplies_ssrgemm_tt_t_16x32x8_16x16x1_4x2_4 using WarpShape = cutlass::gemm::GemmShape<16, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -479,9 +479,9 @@ static void BM_SM50_device_maximum_multiplies_ssrgemm_tt_t_16x64x8_16x32x1_4x4_4 using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -529,9 +529,9 @@ static void BM_SM50_device_maximum_multiplies_ssrgemm_tt_t_16x128x8_16x64x1_4x8_ using WarpShape = cutlass::gemm::GemmShape<16, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename 
cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -579,9 +579,9 @@ static void BM_SM50_device_maximum_multiplies_ssrgemm_tt_t_32x32x8_32x16x1_4x4_8 using WarpShape = cutlass::gemm::GemmShape<32, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -629,9 +629,9 @@ static void BM_SM50_device_maximum_multiplies_ssrgemm_tt_t_32x64x8_32x32x1_8x4_4 using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -679,9 +679,9 @@ static void BM_SM50_device_maximum_multiplies_ssrgemm_tt_t_32x128x8_32x64x1_8x8_ using WarpShape = cutlass::gemm::GemmShape<32, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename 
cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -729,9 +729,9 @@ static void BM_SM50_device_maximum_multiplies_ssrgemm_tt_t_64x64x8_64x32x1_8x8_8 using WarpShape = cutlass::gemm::GemmShape<64, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -779,9 +779,9 @@ static void BM_SM50_device_maximum_multiplies_ssrgemm_tt_t_32x32x8_16x32x1_4x4_4 using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -829,9 +829,9 @@ static void BM_SM50_device_maximum_multiplies_ssrgemm_tt_t_64x32x8_32x32x1_8x4_4 using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename 
cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -879,9 +879,9 @@ static void BM_SM50_device_maximum_multiplies_ssrgemm_tt_t_64x64x8_32x64x1_8x8_4 using WarpShape = cutlass::gemm::GemmShape<32, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -929,9 +929,9 @@ static void BM_SM50_device_maximum_multiplies_ssrgemm_tt_t_128x32x8_64x32x1_8x8_ using WarpShape = cutlass::gemm::GemmShape<64, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -979,9 +979,9 @@ static void BM_SM50_device_maximum_multiplies_ssrgemm_tt_t_16x32x8_8x16x1_2x2_4x using WarpShape = cutlass::gemm::GemmShape<8, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename 
cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1029,9 +1029,9 @@ static void BM_SM50_device_maximum_multiplies_ssrgemm_tt_t_16x64x8_8x32x1_2x4_4x using WarpShape = cutlass::gemm::GemmShape<8, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1079,9 +1079,9 @@ static void BM_SM50_device_maximum_multiplies_ssrgemm_tt_t_32x32x8_16x16x1_4x2_4 using WarpShape = cutlass::gemm::GemmShape<16, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1129,9 +1129,9 @@ static void BM_SM50_device_maximum_multiplies_ssrgemm_tt_t_32x64x8_16x32x1_4x4_4 using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename 
cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1179,9 +1179,9 @@ static void BM_SM50_device_maximum_multiplies_ssrgemm_tt_t_32x128x8_16x64x1_4x8_ using WarpShape = cutlass::gemm::GemmShape<16, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1229,9 +1229,9 @@ static void BM_SM50_device_maximum_multiplies_ssrgemm_tt_t_64x32x8_32x16x1_4x4_8 using WarpShape = cutlass::gemm::GemmShape<32, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1279,9 +1279,9 @@ static void BM_SM50_device_maximum_multiplies_ssrgemm_tt_t_64x64x8_32x32x1_8x4_4 using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename 
cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1329,9 +1329,9 @@ static void BM_SM50_device_maximum_multiplies_ssrgemm_tt_t_64x128x8_32x64x1_8x8_ using WarpShape = cutlass::gemm::GemmShape<32, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1379,9 +1379,9 @@ static void BM_SM50_device_maximum_multiplies_ssrgemm_tt_t_128x32x8_64x16x1_8x4_ using WarpShape = cutlass::gemm::GemmShape<64, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1429,9 +1429,9 @@ static void BM_SM50_device_maximum_multiplies_ssrgemm_tt_t_128x64x8_64x32x1_8x8_ using WarpShape = cutlass::gemm::GemmShape<64, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename 
cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1479,9 +1479,9 @@ static void BM_SM50_device_maximum_multiplies_ssrgemm_tt_t_16x64x16_8x16x1_2x2_4 using WarpShape = cutlass::gemm::GemmShape<8, 16, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1529,9 +1529,9 @@ static void BM_SM50_device_maximum_multiplies_ssrgemm_tt_t_16x128x16_8x32x1_2x4_ using WarpShape = cutlass::gemm::GemmShape<8, 32, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1579,9 +1579,9 @@ static void BM_SM50_device_maximum_multiplies_ssrgemm_tt_t_32x32x8_16x8x1_2x2_8x using WarpShape = cutlass::gemm::GemmShape<16, 8, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename 
cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1629,9 +1629,9 @@ static void BM_SM50_device_maximum_multiplies_ssrgemm_tt_t_32x64x8_16x16x1_4x2_4 using WarpShape = cutlass::gemm::GemmShape<16, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1679,9 +1679,9 @@ static void BM_SM50_device_maximum_multiplies_ssrgemm_tt_t_32x128x8_16x32x1_4x4_ using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1729,9 +1729,9 @@ static void BM_SM50_device_maximum_multiplies_ssrgemm_tt_t_32x256x8_16x64x1_4x8_ using WarpShape = cutlass::gemm::GemmShape<16, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename 
cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1779,9 +1779,9 @@ static void BM_SM50_device_maximum_multiplies_ssrgemm_tt_t_64x64x8_32x16x1_4x4_8 using WarpShape = cutlass::gemm::GemmShape<32, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1829,9 +1829,9 @@ static void BM_SM50_device_maximum_multiplies_ssrgemm_tt_t_64x128x8_32x32x1_8x4_ using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1879,9 +1879,9 @@ static void BM_SM50_device_maximum_multiplies_ssrgemm_tt_t_64x256x8_32x64x1_8x8_ using WarpShape = cutlass::gemm::GemmShape<32, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename 
cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1929,9 +1929,9 @@ static void BM_SM50_device_maximum_multiplies_ssrgemm_tt_t_128x128x8_64x32x1_8x8 using WarpShape = cutlass::gemm::GemmShape<64, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1979,9 +1979,9 @@ static void BM_SM50_device_maximum_multiplies_ssrgemm_tt_t_32x32x8_8x16x1_2x2_4x using WarpShape = cutlass::gemm::GemmShape<8, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -2029,9 +2029,9 @@ static void BM_SM50_device_maximum_multiplies_ssrgemm_tt_t_64x32x8_16x16x1_4x2_4 using WarpShape = cutlass::gemm::GemmShape<16, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename 
cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -2079,9 +2079,9 @@ static void BM_SM50_device_maximum_multiplies_ssrgemm_tt_t_64x64x8_16x32x1_4x4_4 using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -2129,9 +2129,9 @@ static void BM_SM50_device_maximum_multiplies_ssrgemm_tt_t_128x32x8_32x16x1_4x4_ using WarpShape = cutlass::gemm::GemmShape<32, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -2179,9 +2179,9 @@ static void BM_SM50_device_maximum_multiplies_ssrgemm_tt_t_128x64x8_32x32x1_8x4_ using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename 
cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -2229,9 +2229,9 @@ static void BM_SM50_device_maximum_multiplies_ssrgemm_tt_t_128x128x8_32x64x1_8x8 using WarpShape = cutlass::gemm::GemmShape<32, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -2279,9 +2279,9 @@ static void BM_SM50_device_maximum_multiplies_ssrgemm_tt_t_256x32x8_64x16x1_8x4_ using WarpShape = cutlass::gemm::GemmShape<64, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -2329,9 +2329,9 @@ static void BM_SM50_device_maximum_multiplies_ssrgemm_tt_t_256x64x8_64x32x1_8x8_ using WarpShape = cutlass::gemm::GemmShape<64, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename 
cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -2379,9 +2379,9 @@ static void BM_SM50_device_maximum_multiplies_ssrgemm_tt_t_32x64x16_8x16x1_2x2_4 using WarpShape = cutlass::gemm::GemmShape<8, 16, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -2429,9 +2429,9 @@ static void BM_SM50_device_maximum_multiplies_ssrgemm_tt_t_32x128x16_8x32x1_2x4_ using WarpShape = cutlass::gemm::GemmShape<8, 32, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -2479,9 +2479,9 @@ static void BM_SM50_device_maximum_multiplies_ssrgemm_tt_t_64x32x16_16x8x1_2x2_8 using WarpShape = cutlass::gemm::GemmShape<16, 8, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename 
cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -2529,9 +2529,9 @@ static void BM_SM50_device_maximum_multiplies_ssrgemm_tt_t_64x64x8_16x16x1_4x2_4 using WarpShape = cutlass::gemm::GemmShape<16, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -2579,9 +2579,9 @@ static void BM_SM50_device_maximum_multiplies_ssrgemm_tt_t_64x128x8_16x32x1_4x4_ using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -2629,9 +2629,9 @@ static void BM_SM50_device_maximum_multiplies_ssrgemm_tt_t_64x256x8_16x64x1_4x8_ using WarpShape = cutlass::gemm::GemmShape<16, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename 
cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -2679,9 +2679,9 @@ static void BM_SM50_device_maximum_multiplies_ssrgemm_tt_t_128x32x16_32x8x1_4x2_ using WarpShape = cutlass::gemm::GemmShape<32, 8, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -2729,9 +2729,9 @@ static void BM_SM50_device_maximum_multiplies_ssrgemm_tt_t_128x64x8_32x16x1_4x4_ using WarpShape = cutlass::gemm::GemmShape<32, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -2779,9 +2779,9 @@ static void BM_SM50_device_maximum_multiplies_ssrgemm_tt_t_128x128x8_32x32x1_8x4 using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename 
cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -2829,9 +2829,9 @@ static void BM_SM50_device_maximum_multiplies_ssrgemm_tt_t_256x64x8_64x16x1_8x4_ using WarpShape = cutlass::gemm::GemmShape<64, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; diff --git a/bench/device/sm50_simt_maximum_plus_dsrgemm_nn_n.cu b/bench/device/sm50_simt_maximum_plus_dsrgemm_nn_n.cu index 9afe221..c3f6094 100644 --- a/bench/device/sm50_simt_maximum_plus_dsrgemm_nn_n.cu +++ b/bench/device/sm50_simt_maximum_plus_dsrgemm_nn_n.cu @@ -29,9 +29,9 @@ static void BM_SM50_device_maximum_plus_dsrgemm_nn_n_8x32x8_8x32x1_2x4_4x8_1x1(b using WarpShape = cutlass::gemm::GemmShape<8, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -79,9 +79,9 @@ static void BM_SM50_device_maximum_plus_dsrgemm_nn_n_16x32x8_16x32x1_4x4_4x8_1x1 using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; 
- using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -129,9 +129,9 @@ static void BM_SM50_device_maximum_plus_dsrgemm_nn_n_16x64x8_16x64x1_4x8_4x8_1x1 using WarpShape = cutlass::gemm::GemmShape<16, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -179,9 +179,9 @@ static void BM_SM50_device_maximum_plus_dsrgemm_nn_n_32x32x8_32x32x1_8x4_4x8_1x1 using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -229,9 +229,9 @@ static void BM_SM50_device_maximum_plus_dsrgemm_nn_n_8x32x8_8x16x1_2x2_4x8_1x2(b using WarpShape = cutlass::gemm::GemmShape<8, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< 
// - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -279,9 +279,9 @@ static void BM_SM50_device_maximum_plus_dsrgemm_nn_n_8x64x8_8x32x1_2x4_4x8_1x2(b using WarpShape = cutlass::gemm::GemmShape<8, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -329,9 +329,9 @@ static void BM_SM50_device_maximum_plus_dsrgemm_nn_n_16x32x8_16x16x1_4x2_4x8_1x2 using WarpShape = cutlass::gemm::GemmShape<16, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -379,9 +379,9 @@ static void BM_SM50_device_maximum_plus_dsrgemm_nn_n_16x64x8_16x32x1_4x4_4x8_1x2 using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - 
cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -429,9 +429,9 @@ static void BM_SM50_device_maximum_plus_dsrgemm_nn_n_16x128x8_16x64x1_4x8_4x8_1x using WarpShape = cutlass::gemm::GemmShape<16, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -479,9 +479,9 @@ static void BM_SM50_device_maximum_plus_dsrgemm_nn_n_32x32x8_32x16x1_4x4_8x4_1x2 using WarpShape = cutlass::gemm::GemmShape<32, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -529,9 +529,9 @@ static void BM_SM50_device_maximum_plus_dsrgemm_nn_n_32x64x8_32x32x1_8x4_4x8_1x2 using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename 
cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -579,9 +579,9 @@ static void BM_SM50_device_maximum_plus_dsrgemm_nn_n_32x32x8_16x32x1_4x4_4x8_2x1 using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -629,9 +629,9 @@ static void BM_SM50_device_maximum_plus_dsrgemm_nn_n_64x32x8_32x32x1_8x4_4x8_2x1 using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -679,9 +679,9 @@ static void BM_SM50_device_maximum_plus_dsrgemm_nn_n_16x32x8_8x16x1_2x2_4x8_2x2( using WarpShape = cutlass::gemm::GemmShape<8, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, 
precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -729,9 +729,9 @@ static void BM_SM50_device_maximum_plus_dsrgemm_nn_n_16x64x8_8x32x1_2x4_4x8_2x2( using WarpShape = cutlass::gemm::GemmShape<8, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -779,9 +779,9 @@ static void BM_SM50_device_maximum_plus_dsrgemm_nn_n_32x32x8_16x16x1_4x2_4x8_2x2 using WarpShape = cutlass::gemm::GemmShape<16, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -829,9 +829,9 @@ static void BM_SM50_device_maximum_plus_dsrgemm_nn_n_32x64x8_16x32x1_4x4_4x8_2x2 using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using 
AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -879,9 +879,9 @@ static void BM_SM50_device_maximum_plus_dsrgemm_nn_n_32x128x8_16x64x1_4x8_4x8_2x using WarpShape = cutlass::gemm::GemmShape<16, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -929,9 +929,9 @@ static void BM_SM50_device_maximum_plus_dsrgemm_nn_n_64x32x8_32x16x1_4x4_8x4_2x2 using WarpShape = cutlass::gemm::GemmShape<32, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -979,9 +979,9 @@ static void BM_SM50_device_maximum_plus_dsrgemm_nn_n_64x64x8_32x32x1_8x4_4x8_2x2 using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ 
-1029,9 +1029,9 @@ static void BM_SM50_device_maximum_plus_dsrgemm_nn_n_128x32x8_64x16x1_8x4_8x4_2x using WarpShape = cutlass::gemm::GemmShape<64, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1079,9 +1079,9 @@ static void BM_SM50_device_maximum_plus_dsrgemm_nn_n_16x64x16_8x16x1_2x2_4x8_2x4 using WarpShape = cutlass::gemm::GemmShape<8, 16, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1129,9 +1129,9 @@ static void BM_SM50_device_maximum_plus_dsrgemm_nn_n_16x128x16_8x32x1_2x4_4x8_2x using WarpShape = cutlass::gemm::GemmShape<8, 32, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1179,9 +1179,9 @@ static void 
BM_SM50_device_maximum_plus_dsrgemm_nn_n_32x32x8_16x8x1_2x2_8x4_2x4( using WarpShape = cutlass::gemm::GemmShape<16, 8, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1229,9 +1229,9 @@ static void BM_SM50_device_maximum_plus_dsrgemm_nn_n_32x64x8_16x16x1_4x2_4x8_2x4 using WarpShape = cutlass::gemm::GemmShape<16, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1279,9 +1279,9 @@ static void BM_SM50_device_maximum_plus_dsrgemm_nn_n_32x128x8_16x32x1_4x4_4x8_2x using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1329,9 +1329,9 @@ static void BM_SM50_device_maximum_plus_dsrgemm_nn_n_64x64x8_32x16x1_4x4_8x4_2x4 
using WarpShape = cutlass::gemm::GemmShape<32, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1379,9 +1379,9 @@ static void BM_SM50_device_maximum_plus_dsrgemm_nn_n_32x32x8_8x16x1_2x2_4x8_4x2( using WarpShape = cutlass::gemm::GemmShape<8, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1429,9 +1429,9 @@ static void BM_SM50_device_maximum_plus_dsrgemm_nn_n_64x32x8_16x16x1_4x2_4x8_4x2 using WarpShape = cutlass::gemm::GemmShape<16, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1479,9 +1479,9 @@ static void BM_SM50_device_maximum_plus_dsrgemm_nn_n_64x64x8_16x32x1_4x4_4x8_4x2 using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using 
InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1529,9 +1529,9 @@ static void BM_SM50_device_maximum_plus_dsrgemm_nn_n_128x32x8_32x16x1_4x4_8x4_4x using WarpShape = cutlass::gemm::GemmShape<32, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1579,9 +1579,9 @@ static void BM_SM50_device_maximum_plus_dsrgemm_nn_n_32x64x16_8x16x1_2x2_4x8_4x4 using WarpShape = cutlass::gemm::GemmShape<8, 16, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1629,9 +1629,9 @@ static void BM_SM50_device_maximum_plus_dsrgemm_nn_n_32x128x16_8x32x1_2x4_4x8_4x using WarpShape = cutlass::gemm::GemmShape<8, 32, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = 
typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1679,9 +1679,9 @@ static void BM_SM50_device_maximum_plus_dsrgemm_nn_n_64x32x16_16x8x1_2x2_8x4_4x4 using WarpShape = cutlass::gemm::GemmShape<16, 8, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1729,9 +1729,9 @@ static void BM_SM50_device_maximum_plus_dsrgemm_nn_n_64x64x8_16x16x1_4x2_4x8_4x4 using WarpShape = cutlass::gemm::GemmShape<16, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1779,9 +1779,9 @@ static void BM_SM50_device_maximum_plus_dsrgemm_nn_n_128x32x16_32x8x1_4x2_8x4_4x using WarpShape = cutlass::gemm::GemmShape<32, 8, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - 
precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; diff --git a/bench/device/sm50_simt_maximum_plus_dsrgemm_nn_t.cu b/bench/device/sm50_simt_maximum_plus_dsrgemm_nn_t.cu index dcac1f3..292a9df 100644 --- a/bench/device/sm50_simt_maximum_plus_dsrgemm_nn_t.cu +++ b/bench/device/sm50_simt_maximum_plus_dsrgemm_nn_t.cu @@ -29,9 +29,9 @@ static void BM_SM50_device_maximum_plus_dsrgemm_nn_t_8x32x8_8x32x1_2x4_4x8_1x1(b using WarpShape = cutlass::gemm::GemmShape<8, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -79,9 +79,9 @@ static void BM_SM50_device_maximum_plus_dsrgemm_nn_t_16x32x8_16x32x1_4x4_4x8_1x1 using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -129,9 +129,9 @@ static void BM_SM50_device_maximum_plus_dsrgemm_nn_t_16x64x8_16x64x1_4x8_4x8_1x1 using 
WarpShape = cutlass::gemm::GemmShape<16, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -179,9 +179,9 @@ static void BM_SM50_device_maximum_plus_dsrgemm_nn_t_32x32x8_32x32x1_8x4_4x8_1x1 using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -229,9 +229,9 @@ static void BM_SM50_device_maximum_plus_dsrgemm_nn_t_8x32x8_8x16x1_2x2_4x8_1x2(b using WarpShape = cutlass::gemm::GemmShape<8, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -279,9 +279,9 @@ static void BM_SM50_device_maximum_plus_dsrgemm_nn_t_8x64x8_8x32x1_2x4_4x8_1x2(b using WarpShape = cutlass::gemm::GemmShape<8, 32, 8>; using InstructionShape = 
cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -329,9 +329,9 @@ static void BM_SM50_device_maximum_plus_dsrgemm_nn_t_16x32x8_16x16x1_4x2_4x8_1x2 using WarpShape = cutlass::gemm::GemmShape<16, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -379,9 +379,9 @@ static void BM_SM50_device_maximum_plus_dsrgemm_nn_t_16x64x8_16x32x1_4x4_4x8_1x2 using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -429,9 +429,9 @@ static void BM_SM50_device_maximum_plus_dsrgemm_nn_t_16x128x8_16x64x1_4x8_4x8_1x using WarpShape = cutlass::gemm::GemmShape<16, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename 
cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -479,9 +479,9 @@ static void BM_SM50_device_maximum_plus_dsrgemm_nn_t_32x32x8_32x16x1_4x4_8x4_1x2 using WarpShape = cutlass::gemm::GemmShape<32, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -529,9 +529,9 @@ static void BM_SM50_device_maximum_plus_dsrgemm_nn_t_32x64x8_32x32x1_8x4_4x8_1x2 using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -579,9 +579,9 @@ static void BM_SM50_device_maximum_plus_dsrgemm_nn_t_32x32x8_16x32x1_4x4_4x8_2x1 using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, 
precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -629,9 +629,9 @@ static void BM_SM50_device_maximum_plus_dsrgemm_nn_t_64x32x8_32x32x1_8x4_4x8_2x1 using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -679,9 +679,9 @@ static void BM_SM50_device_maximum_plus_dsrgemm_nn_t_16x32x8_8x16x1_2x2_4x8_2x2( using WarpShape = cutlass::gemm::GemmShape<8, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -729,9 +729,9 @@ static void BM_SM50_device_maximum_plus_dsrgemm_nn_t_16x64x8_8x32x1_2x4_4x8_2x2( using WarpShape = cutlass::gemm::GemmShape<8, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, 
SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -779,9 +779,9 @@ static void BM_SM50_device_maximum_plus_dsrgemm_nn_t_32x32x8_16x16x1_4x2_4x8_2x2 using WarpShape = cutlass::gemm::GemmShape<16, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -829,9 +829,9 @@ static void BM_SM50_device_maximum_plus_dsrgemm_nn_t_32x64x8_16x32x1_4x4_4x8_2x2 using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -879,9 +879,9 @@ static void BM_SM50_device_maximum_plus_dsrgemm_nn_t_32x128x8_16x64x1_4x8_4x8_2x using WarpShape = cutlass::gemm::GemmShape<16, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename 
cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -929,9 +929,9 @@ static void BM_SM50_device_maximum_plus_dsrgemm_nn_t_64x32x8_32x16x1_4x4_8x4_2x2 using WarpShape = cutlass::gemm::GemmShape<32, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -979,9 +979,9 @@ static void BM_SM50_device_maximum_plus_dsrgemm_nn_t_64x64x8_32x32x1_8x4_4x8_2x2 using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1029,9 +1029,9 @@ static void BM_SM50_device_maximum_plus_dsrgemm_nn_t_128x32x8_64x16x1_8x4_8x4_2x using WarpShape = cutlass::gemm::GemmShape<64, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, 
precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1079,9 +1079,9 @@ static void BM_SM50_device_maximum_plus_dsrgemm_nn_t_16x64x16_8x16x1_2x2_4x8_2x4 using WarpShape = cutlass::gemm::GemmShape<8, 16, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1129,9 +1129,9 @@ static void BM_SM50_device_maximum_plus_dsrgemm_nn_t_16x128x16_8x32x1_2x4_4x8_2x using WarpShape = cutlass::gemm::GemmShape<8, 32, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1179,9 +1179,9 @@ static void BM_SM50_device_maximum_plus_dsrgemm_nn_t_32x32x8_16x8x1_2x2_8x4_2x4( using WarpShape = cutlass::gemm::GemmShape<16, 8, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; 
using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1229,9 +1229,9 @@ static void BM_SM50_device_maximum_plus_dsrgemm_nn_t_32x64x8_16x16x1_4x2_4x8_2x4 using WarpShape = cutlass::gemm::GemmShape<16, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1279,9 +1279,9 @@ static void BM_SM50_device_maximum_plus_dsrgemm_nn_t_32x128x8_16x32x1_4x4_4x8_2x using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1329,9 +1329,9 @@ static void BM_SM50_device_maximum_plus_dsrgemm_nn_t_64x64x8_32x16x1_4x4_8x4_2x4 using WarpShape = cutlass::gemm::GemmShape<32, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = 
Config::MultiplicationOp; @@ -1379,9 +1379,9 @@ static void BM_SM50_device_maximum_plus_dsrgemm_nn_t_32x32x8_8x16x1_2x2_4x8_4x2( using WarpShape = cutlass::gemm::GemmShape<8, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1429,9 +1429,9 @@ static void BM_SM50_device_maximum_plus_dsrgemm_nn_t_64x32x8_16x16x1_4x2_4x8_4x2 using WarpShape = cutlass::gemm::GemmShape<16, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1479,9 +1479,9 @@ static void BM_SM50_device_maximum_plus_dsrgemm_nn_t_64x64x8_16x32x1_4x4_4x8_4x2 using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1529,9 +1529,9 @@ static void 
BM_SM50_device_maximum_plus_dsrgemm_nn_t_128x32x8_32x16x1_4x4_8x4_4x using WarpShape = cutlass::gemm::GemmShape<32, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1579,9 +1579,9 @@ static void BM_SM50_device_maximum_plus_dsrgemm_nn_t_32x64x16_8x16x1_2x2_4x8_4x4 using WarpShape = cutlass::gemm::GemmShape<8, 16, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1629,9 +1629,9 @@ static void BM_SM50_device_maximum_plus_dsrgemm_nn_t_32x128x16_8x32x1_2x4_4x8_4x using WarpShape = cutlass::gemm::GemmShape<8, 32, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1679,9 +1679,9 @@ static void BM_SM50_device_maximum_plus_dsrgemm_nn_t_64x32x16_16x8x1_2x2_8x4_4x4 
using WarpShape = cutlass::gemm::GemmShape<16, 8, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1729,9 +1729,9 @@ static void BM_SM50_device_maximum_plus_dsrgemm_nn_t_64x64x8_16x16x1_4x2_4x8_4x4 using WarpShape = cutlass::gemm::GemmShape<16, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1779,9 +1779,9 @@ static void BM_SM50_device_maximum_plus_dsrgemm_nn_t_128x32x16_32x8x1_4x2_8x4_4x using WarpShape = cutlass::gemm::GemmShape<32, 8, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; diff --git a/bench/device/sm50_simt_maximum_plus_dsrgemm_nt_n.cu b/bench/device/sm50_simt_maximum_plus_dsrgemm_nt_n.cu index cfed1c5..ce33c3e 100644 --- 
a/bench/device/sm50_simt_maximum_plus_dsrgemm_nt_n.cu +++ b/bench/device/sm50_simt_maximum_plus_dsrgemm_nt_n.cu @@ -29,9 +29,9 @@ static void BM_SM50_device_maximum_plus_dsrgemm_nt_n_8x32x8_8x32x1_2x4_4x8_1x1(b using WarpShape = cutlass::gemm::GemmShape<8, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -79,9 +79,9 @@ static void BM_SM50_device_maximum_plus_dsrgemm_nt_n_16x32x8_16x32x1_4x4_4x8_1x1 using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -129,9 +129,9 @@ static void BM_SM50_device_maximum_plus_dsrgemm_nt_n_16x64x8_16x64x1_4x8_4x8_1x1 using WarpShape = cutlass::gemm::GemmShape<16, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using 
MultOp = Config::MultiplicationOp; @@ -179,9 +179,9 @@ static void BM_SM50_device_maximum_plus_dsrgemm_nt_n_32x32x8_32x32x1_8x4_4x8_1x1 using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -229,9 +229,9 @@ static void BM_SM50_device_maximum_plus_dsrgemm_nt_n_8x32x8_8x16x1_2x2_4x8_1x2(b using WarpShape = cutlass::gemm::GemmShape<8, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -279,9 +279,9 @@ static void BM_SM50_device_maximum_plus_dsrgemm_nt_n_8x64x8_8x32x1_2x4_4x8_1x2(b using WarpShape = cutlass::gemm::GemmShape<8, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -329,9 +329,9 @@ static void 
BM_SM50_device_maximum_plus_dsrgemm_nt_n_16x32x8_16x16x1_4x2_4x8_1x2 using WarpShape = cutlass::gemm::GemmShape<16, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -379,9 +379,9 @@ static void BM_SM50_device_maximum_plus_dsrgemm_nt_n_16x64x8_16x32x1_4x4_4x8_1x2 using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -429,9 +429,9 @@ static void BM_SM50_device_maximum_plus_dsrgemm_nt_n_16x128x8_16x64x1_4x8_4x8_1x using WarpShape = cutlass::gemm::GemmShape<16, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -479,9 +479,9 @@ static void BM_SM50_device_maximum_plus_dsrgemm_nt_n_32x32x8_32x16x1_4x4_8x4_1x2 using 
WarpShape = cutlass::gemm::GemmShape<32, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -529,9 +529,9 @@ static void BM_SM50_device_maximum_plus_dsrgemm_nt_n_32x64x8_32x32x1_8x4_4x8_1x2 using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -579,9 +579,9 @@ static void BM_SM50_device_maximum_plus_dsrgemm_nt_n_32x32x8_16x32x1_4x4_4x8_2x1 using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -629,9 +629,9 @@ static void BM_SM50_device_maximum_plus_dsrgemm_nt_n_64x32x8_32x32x1_8x4_4x8_2x1 using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = 
cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -679,9 +679,9 @@ static void BM_SM50_device_maximum_plus_dsrgemm_nt_n_16x32x8_8x16x1_2x2_4x8_2x2( using WarpShape = cutlass::gemm::GemmShape<8, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -729,9 +729,9 @@ static void BM_SM50_device_maximum_plus_dsrgemm_nt_n_16x64x8_8x32x1_2x4_4x8_2x2( using WarpShape = cutlass::gemm::GemmShape<8, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -779,9 +779,9 @@ static void BM_SM50_device_maximum_plus_dsrgemm_nt_n_32x32x8_16x16x1_4x2_4x8_2x2 using WarpShape = cutlass::gemm::GemmShape<16, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename 
cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -829,9 +829,9 @@ static void BM_SM50_device_maximum_plus_dsrgemm_nt_n_32x64x8_16x32x1_4x4_4x8_2x2 using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -879,9 +879,9 @@ static void BM_SM50_device_maximum_plus_dsrgemm_nt_n_32x128x8_16x64x1_4x8_4x8_2x using WarpShape = cutlass::gemm::GemmShape<16, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -929,9 +929,9 @@ static void BM_SM50_device_maximum_plus_dsrgemm_nt_n_64x32x8_32x16x1_4x4_8x4_2x2 using WarpShape = cutlass::gemm::GemmShape<32, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, 
precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -979,9 +979,9 @@ static void BM_SM50_device_maximum_plus_dsrgemm_nt_n_64x64x8_32x32x1_8x4_4x8_2x2 using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1029,9 +1029,9 @@ static void BM_SM50_device_maximum_plus_dsrgemm_nt_n_128x32x8_64x16x1_8x4_8x4_2x using WarpShape = cutlass::gemm::GemmShape<64, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1079,9 +1079,9 @@ static void BM_SM50_device_maximum_plus_dsrgemm_nt_n_16x64x16_8x16x1_2x2_4x8_2x4 using WarpShape = cutlass::gemm::GemmShape<8, 16, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, 
cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1129,9 +1129,9 @@ static void BM_SM50_device_maximum_plus_dsrgemm_nt_n_16x128x16_8x32x1_2x4_4x8_2x using WarpShape = cutlass::gemm::GemmShape<8, 32, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1179,9 +1179,9 @@ static void BM_SM50_device_maximum_plus_dsrgemm_nt_n_32x32x8_16x8x1_2x2_8x4_2x4( using WarpShape = cutlass::gemm::GemmShape<16, 8, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1229,9 +1229,9 @@ static void BM_SM50_device_maximum_plus_dsrgemm_nt_n_32x64x8_16x16x1_4x2_4x8_2x4 using WarpShape = cutlass::gemm::GemmShape<16, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename 
cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1279,9 +1279,9 @@ static void BM_SM50_device_maximum_plus_dsrgemm_nt_n_32x128x8_16x32x1_4x4_4x8_2x using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1329,9 +1329,9 @@ static void BM_SM50_device_maximum_plus_dsrgemm_nt_n_64x64x8_32x16x1_4x4_8x4_2x4 using WarpShape = cutlass::gemm::GemmShape<32, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1379,9 +1379,9 @@ static void BM_SM50_device_maximum_plus_dsrgemm_nt_n_32x32x8_8x16x1_2x2_4x8_4x2( using WarpShape = cutlass::gemm::GemmShape<8, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, 
precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1429,9 +1429,9 @@ static void BM_SM50_device_maximum_plus_dsrgemm_nt_n_64x32x8_16x16x1_4x2_4x8_4x2 using WarpShape = cutlass::gemm::GemmShape<16, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1479,9 +1479,9 @@ static void BM_SM50_device_maximum_plus_dsrgemm_nt_n_64x64x8_16x32x1_4x4_4x8_4x2 using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1529,9 +1529,9 @@ static void BM_SM50_device_maximum_plus_dsrgemm_nt_n_128x32x8_32x16x1_4x4_8x4_4x using WarpShape = cutlass::gemm::GemmShape<32, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, 
OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1579,9 +1579,9 @@ static void BM_SM50_device_maximum_plus_dsrgemm_nt_n_32x64x16_8x16x1_2x2_4x8_4x4 using WarpShape = cutlass::gemm::GemmShape<8, 16, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1629,9 +1629,9 @@ static void BM_SM50_device_maximum_plus_dsrgemm_nt_n_32x128x16_8x32x1_2x4_4x8_4x using WarpShape = cutlass::gemm::GemmShape<8, 32, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1679,9 +1679,9 @@ static void BM_SM50_device_maximum_plus_dsrgemm_nt_n_64x32x16_16x8x1_2x2_8x4_4x4 using WarpShape = cutlass::gemm::GemmShape<16, 8, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = 
Config::MultiplicationOp; @@ -1729,9 +1729,9 @@ static void BM_SM50_device_maximum_plus_dsrgemm_nt_n_64x64x8_16x16x1_4x2_4x8_4x4 using WarpShape = cutlass::gemm::GemmShape<16, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1779,9 +1779,9 @@ static void BM_SM50_device_maximum_plus_dsrgemm_nt_n_128x32x16_32x8x1_4x2_8x4_4x using WarpShape = cutlass::gemm::GemmShape<32, 8, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; diff --git a/bench/device/sm50_simt_maximum_plus_dsrgemm_nt_t.cu b/bench/device/sm50_simt_maximum_plus_dsrgemm_nt_t.cu index 327485e..a680755 100644 --- a/bench/device/sm50_simt_maximum_plus_dsrgemm_nt_t.cu +++ b/bench/device/sm50_simt_maximum_plus_dsrgemm_nt_t.cu @@ -29,9 +29,9 @@ static void BM_SM50_device_maximum_plus_dsrgemm_nt_t_8x32x8_8x32x1_2x4_4x8_1x1(b using WarpShape = cutlass::gemm::GemmShape<8, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename 
cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -79,9 +79,9 @@ static void BM_SM50_device_maximum_plus_dsrgemm_nt_t_16x32x8_16x32x1_4x4_4x8_1x1 using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -129,9 +129,9 @@ static void BM_SM50_device_maximum_plus_dsrgemm_nt_t_16x64x8_16x64x1_4x8_4x8_1x1 using WarpShape = cutlass::gemm::GemmShape<16, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -179,9 +179,9 @@ static void BM_SM50_device_maximum_plus_dsrgemm_nt_t_32x32x8_32x32x1_8x4_4x8_1x1 using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, 
precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -229,9 +229,9 @@ static void BM_SM50_device_maximum_plus_dsrgemm_nt_t_8x32x8_8x16x1_2x2_4x8_1x2(b using WarpShape = cutlass::gemm::GemmShape<8, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -279,9 +279,9 @@ static void BM_SM50_device_maximum_plus_dsrgemm_nt_t_8x64x8_8x32x1_2x4_4x8_1x2(b using WarpShape = cutlass::gemm::GemmShape<8, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -329,9 +329,9 @@ static void BM_SM50_device_maximum_plus_dsrgemm_nt_t_16x32x8_16x16x1_4x2_4x8_1x2 using WarpShape = cutlass::gemm::GemmShape<16, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using 
AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -379,9 +379,9 @@ static void BM_SM50_device_maximum_plus_dsrgemm_nt_t_16x64x8_16x32x1_4x4_4x8_1x2 using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -429,9 +429,9 @@ static void BM_SM50_device_maximum_plus_dsrgemm_nt_t_16x128x8_16x64x1_4x8_4x8_1x using WarpShape = cutlass::gemm::GemmShape<16, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -479,9 +479,9 @@ static void BM_SM50_device_maximum_plus_dsrgemm_nt_t_32x32x8_32x16x1_4x4_8x4_1x2 using WarpShape = cutlass::gemm::GemmShape<32, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ 
-529,9 +529,9 @@ static void BM_SM50_device_maximum_plus_dsrgemm_nt_t_32x64x8_32x32x1_8x4_4x8_1x2 using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -579,9 +579,9 @@ static void BM_SM50_device_maximum_plus_dsrgemm_nt_t_32x32x8_16x32x1_4x4_4x8_2x1 using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -629,9 +629,9 @@ static void BM_SM50_device_maximum_plus_dsrgemm_nt_t_64x32x8_32x32x1_8x4_4x8_2x1 using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -679,9 +679,9 @@ static void 
BM_SM50_device_maximum_plus_dsrgemm_nt_t_16x32x8_8x16x1_2x2_4x8_2x2( using WarpShape = cutlass::gemm::GemmShape<8, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -729,9 +729,9 @@ static void BM_SM50_device_maximum_plus_dsrgemm_nt_t_16x64x8_8x32x1_2x4_4x8_2x2( using WarpShape = cutlass::gemm::GemmShape<8, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -779,9 +779,9 @@ static void BM_SM50_device_maximum_plus_dsrgemm_nt_t_32x32x8_16x16x1_4x2_4x8_2x2 using WarpShape = cutlass::gemm::GemmShape<16, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -829,9 +829,9 @@ static void BM_SM50_device_maximum_plus_dsrgemm_nt_t_32x64x8_16x32x1_4x4_4x8_2x2 using 
WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -879,9 +879,9 @@ static void BM_SM50_device_maximum_plus_dsrgemm_nt_t_32x128x8_16x64x1_4x8_4x8_2x using WarpShape = cutlass::gemm::GemmShape<16, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -929,9 +929,9 @@ static void BM_SM50_device_maximum_plus_dsrgemm_nt_t_64x32x8_32x16x1_4x4_8x4_2x2 using WarpShape = cutlass::gemm::GemmShape<32, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -979,9 +979,9 @@ static void BM_SM50_device_maximum_plus_dsrgemm_nt_t_64x64x8_32x32x1_8x4_4x8_2x2 using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = 
cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1029,9 +1029,9 @@ static void BM_SM50_device_maximum_plus_dsrgemm_nt_t_128x32x8_64x16x1_8x4_8x4_2x using WarpShape = cutlass::gemm::GemmShape<64, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1079,9 +1079,9 @@ static void BM_SM50_device_maximum_plus_dsrgemm_nt_t_16x64x16_8x16x1_2x2_4x8_2x4 using WarpShape = cutlass::gemm::GemmShape<8, 16, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1129,9 +1129,9 @@ static void BM_SM50_device_maximum_plus_dsrgemm_nt_t_16x128x16_8x32x1_2x4_4x8_2x using WarpShape = cutlass::gemm::GemmShape<8, 32, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename 
cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1179,9 +1179,9 @@ static void BM_SM50_device_maximum_plus_dsrgemm_nt_t_32x32x8_16x8x1_2x2_8x4_2x4( using WarpShape = cutlass::gemm::GemmShape<16, 8, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1229,9 +1229,9 @@ static void BM_SM50_device_maximum_plus_dsrgemm_nt_t_32x64x8_16x16x1_4x2_4x8_2x4 using WarpShape = cutlass::gemm::GemmShape<16, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1279,9 +1279,9 @@ static void BM_SM50_device_maximum_plus_dsrgemm_nt_t_32x128x8_16x32x1_4x4_4x8_2x using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, 
precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1329,9 +1329,9 @@ static void BM_SM50_device_maximum_plus_dsrgemm_nt_t_64x64x8_32x16x1_4x4_8x4_2x4 using WarpShape = cutlass::gemm::GemmShape<32, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1379,9 +1379,9 @@ static void BM_SM50_device_maximum_plus_dsrgemm_nt_t_32x32x8_8x16x1_2x2_4x8_4x2( using WarpShape = cutlass::gemm::GemmShape<8, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1429,9 +1429,9 @@ static void BM_SM50_device_maximum_plus_dsrgemm_nt_t_64x32x8_16x16x1_4x2_4x8_4x2 using WarpShape = cutlass::gemm::GemmShape<16, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, 
cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1479,9 +1479,9 @@ static void BM_SM50_device_maximum_plus_dsrgemm_nt_t_64x64x8_16x32x1_4x4_4x8_4x2 using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1529,9 +1529,9 @@ static void BM_SM50_device_maximum_plus_dsrgemm_nt_t_128x32x8_32x16x1_4x4_8x4_4x using WarpShape = cutlass::gemm::GemmShape<32, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1579,9 +1579,9 @@ static void BM_SM50_device_maximum_plus_dsrgemm_nt_t_32x64x16_8x16x1_2x2_4x8_4x4 using WarpShape = cutlass::gemm::GemmShape<8, 16, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename 
cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1629,9 +1629,9 @@ static void BM_SM50_device_maximum_plus_dsrgemm_nt_t_32x128x16_8x32x1_2x4_4x8_4x using WarpShape = cutlass::gemm::GemmShape<8, 32, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1679,9 +1679,9 @@ static void BM_SM50_device_maximum_plus_dsrgemm_nt_t_64x32x16_16x8x1_2x2_8x4_4x4 using WarpShape = cutlass::gemm::GemmShape<16, 8, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1729,9 +1729,9 @@ static void BM_SM50_device_maximum_plus_dsrgemm_nt_t_64x64x8_16x16x1_4x2_4x8_4x4 using WarpShape = cutlass::gemm::GemmShape<16, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, 
precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1779,9 +1779,9 @@ static void BM_SM50_device_maximum_plus_dsrgemm_nt_t_128x32x16_32x8x1_4x2_8x4_4x using WarpShape = cutlass::gemm::GemmShape<32, 8, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; diff --git a/bench/device/sm50_simt_maximum_plus_dsrgemm_tn_n.cu b/bench/device/sm50_simt_maximum_plus_dsrgemm_tn_n.cu index 2cecd50..0188cc1 100644 --- a/bench/device/sm50_simt_maximum_plus_dsrgemm_tn_n.cu +++ b/bench/device/sm50_simt_maximum_plus_dsrgemm_tn_n.cu @@ -29,9 +29,9 @@ static void BM_SM50_device_maximum_plus_dsrgemm_tn_n_8x32x8_8x32x1_2x4_4x8_1x1(b using WarpShape = cutlass::gemm::GemmShape<8, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -79,9 +79,9 @@ static void BM_SM50_device_maximum_plus_dsrgemm_tn_n_16x32x8_16x32x1_4x4_4x8_1x1 using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - 
precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -129,9 +129,9 @@ static void BM_SM50_device_maximum_plus_dsrgemm_tn_n_16x64x8_16x64x1_4x8_4x8_1x1 using WarpShape = cutlass::gemm::GemmShape<16, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -179,9 +179,9 @@ static void BM_SM50_device_maximum_plus_dsrgemm_tn_n_32x32x8_32x32x1_8x4_4x8_1x1 using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -229,9 +229,9 @@ static void BM_SM50_device_maximum_plus_dsrgemm_tn_n_8x32x8_8x16x1_2x2_4x8_1x2(b using WarpShape = cutlass::gemm::GemmShape<8, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, 
cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -279,9 +279,9 @@ static void BM_SM50_device_maximum_plus_dsrgemm_tn_n_8x64x8_8x32x1_2x4_4x8_1x2(b using WarpShape = cutlass::gemm::GemmShape<8, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -329,9 +329,9 @@ static void BM_SM50_device_maximum_plus_dsrgemm_tn_n_16x32x8_16x16x1_4x2_4x8_1x2 using WarpShape = cutlass::gemm::GemmShape<16, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -379,9 +379,9 @@ static void BM_SM50_device_maximum_plus_dsrgemm_tn_n_16x64x8_16x32x1_4x4_4x8_1x2 using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename 
cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -429,9 +429,9 @@ static void BM_SM50_device_maximum_plus_dsrgemm_tn_n_16x128x8_16x64x1_4x8_4x8_1x using WarpShape = cutlass::gemm::GemmShape<16, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -479,9 +479,9 @@ static void BM_SM50_device_maximum_plus_dsrgemm_tn_n_32x32x8_32x16x1_4x4_8x4_1x2 using WarpShape = cutlass::gemm::GemmShape<32, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -529,9 +529,9 @@ static void BM_SM50_device_maximum_plus_dsrgemm_tn_n_32x64x8_32x32x1_8x4_4x8_1x2 using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, 
precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -579,9 +579,9 @@ static void BM_SM50_device_maximum_plus_dsrgemm_tn_n_32x32x8_16x32x1_4x4_4x8_2x1 using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -629,9 +629,9 @@ static void BM_SM50_device_maximum_plus_dsrgemm_tn_n_64x32x8_32x32x1_8x4_4x8_2x1 using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -679,9 +679,9 @@ static void BM_SM50_device_maximum_plus_dsrgemm_tn_n_16x32x8_8x16x1_2x2_4x8_2x2( using WarpShape = cutlass::gemm::GemmShape<8, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using 
AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -729,9 +729,9 @@ static void BM_SM50_device_maximum_plus_dsrgemm_tn_n_16x64x8_8x32x1_2x4_4x8_2x2( using WarpShape = cutlass::gemm::GemmShape<8, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -779,9 +779,9 @@ static void BM_SM50_device_maximum_plus_dsrgemm_tn_n_32x32x8_16x16x1_4x2_4x8_2x2 using WarpShape = cutlass::gemm::GemmShape<16, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -829,9 +829,9 @@ static void BM_SM50_device_maximum_plus_dsrgemm_tn_n_32x64x8_16x32x1_4x4_4x8_2x2 using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ 
-879,9 +879,9 @@ static void BM_SM50_device_maximum_plus_dsrgemm_tn_n_32x128x8_16x64x1_4x8_4x8_2x using WarpShape = cutlass::gemm::GemmShape<16, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -929,9 +929,9 @@ static void BM_SM50_device_maximum_plus_dsrgemm_tn_n_64x32x8_32x16x1_4x4_8x4_2x2 using WarpShape = cutlass::gemm::GemmShape<32, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -979,9 +979,9 @@ static void BM_SM50_device_maximum_plus_dsrgemm_tn_n_64x64x8_32x32x1_8x4_4x8_2x2 using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1029,9 +1029,9 @@ static void 
BM_SM50_device_maximum_plus_dsrgemm_tn_n_128x32x8_64x16x1_8x4_8x4_2x using WarpShape = cutlass::gemm::GemmShape<64, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1079,9 +1079,9 @@ static void BM_SM50_device_maximum_plus_dsrgemm_tn_n_16x64x16_8x16x1_2x2_4x8_2x4 using WarpShape = cutlass::gemm::GemmShape<8, 16, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1129,9 +1129,9 @@ static void BM_SM50_device_maximum_plus_dsrgemm_tn_n_16x128x16_8x32x1_2x4_4x8_2x using WarpShape = cutlass::gemm::GemmShape<8, 32, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1179,9 +1179,9 @@ static void BM_SM50_device_maximum_plus_dsrgemm_tn_n_32x32x8_16x8x1_2x2_8x4_2x4( 
using WarpShape = cutlass::gemm::GemmShape<16, 8, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1229,9 +1229,9 @@ static void BM_SM50_device_maximum_plus_dsrgemm_tn_n_32x64x8_16x16x1_4x2_4x8_2x4 using WarpShape = cutlass::gemm::GemmShape<16, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1279,9 +1279,9 @@ static void BM_SM50_device_maximum_plus_dsrgemm_tn_n_32x128x8_16x32x1_4x4_4x8_2x using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1329,9 +1329,9 @@ static void BM_SM50_device_maximum_plus_dsrgemm_tn_n_64x64x8_32x16x1_4x4_8x4_2x4 using WarpShape = cutlass::gemm::GemmShape<32, 16, 8>; using 
InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1379,9 +1379,9 @@ static void BM_SM50_device_maximum_plus_dsrgemm_tn_n_32x32x8_8x16x1_2x2_4x8_4x2( using WarpShape = cutlass::gemm::GemmShape<8, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1429,9 +1429,9 @@ static void BM_SM50_device_maximum_plus_dsrgemm_tn_n_64x32x8_16x16x1_4x2_4x8_4x2 using WarpShape = cutlass::gemm::GemmShape<16, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1479,9 +1479,9 @@ static void BM_SM50_device_maximum_plus_dsrgemm_tn_n_64x64x8_16x32x1_4x4_4x8_4x2 using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = 
typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1529,9 +1529,9 @@ static void BM_SM50_device_maximum_plus_dsrgemm_tn_n_128x32x8_32x16x1_4x4_8x4_4x using WarpShape = cutlass::gemm::GemmShape<32, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1579,9 +1579,9 @@ static void BM_SM50_device_maximum_plus_dsrgemm_tn_n_32x64x16_8x16x1_2x2_4x8_4x4 using WarpShape = cutlass::gemm::GemmShape<8, 16, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1629,9 +1629,9 @@ static void BM_SM50_device_maximum_plus_dsrgemm_tn_n_32x128x16_8x32x1_2x4_4x8_4x using WarpShape = cutlass::gemm::GemmShape<8, 32, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - 
precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1679,9 +1679,9 @@ static void BM_SM50_device_maximum_plus_dsrgemm_tn_n_64x32x16_16x8x1_2x2_8x4_4x4 using WarpShape = cutlass::gemm::GemmShape<16, 8, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1729,9 +1729,9 @@ static void BM_SM50_device_maximum_plus_dsrgemm_tn_n_64x64x8_16x16x1_4x2_4x8_4x4 using WarpShape = cutlass::gemm::GemmShape<16, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1779,9 +1779,9 @@ static void BM_SM50_device_maximum_plus_dsrgemm_tn_n_128x32x16_32x8x1_4x2_8x4_4x using WarpShape = cutlass::gemm::GemmShape<32, 8, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - 
cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; diff --git a/bench/device/sm50_simt_maximum_plus_dsrgemm_tn_t.cu b/bench/device/sm50_simt_maximum_plus_dsrgemm_tn_t.cu index 42af41e..21bbb72 100644 --- a/bench/device/sm50_simt_maximum_plus_dsrgemm_tn_t.cu +++ b/bench/device/sm50_simt_maximum_plus_dsrgemm_tn_t.cu @@ -29,9 +29,9 @@ static void BM_SM50_device_maximum_plus_dsrgemm_tn_t_8x32x8_8x32x1_2x4_4x8_1x1(b using WarpShape = cutlass::gemm::GemmShape<8, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -79,9 +79,9 @@ static void BM_SM50_device_maximum_plus_dsrgemm_tn_t_16x32x8_16x32x1_4x4_4x8_1x1 using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -129,9 +129,9 @@ static void BM_SM50_device_maximum_plus_dsrgemm_tn_t_16x64x8_16x64x1_4x8_4x8_1x1 using WarpShape = cutlass::gemm::GemmShape<16, 64, 8>; using 
InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -179,9 +179,9 @@ static void BM_SM50_device_maximum_plus_dsrgemm_tn_t_32x32x8_32x32x1_8x4_4x8_1x1 using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -229,9 +229,9 @@ static void BM_SM50_device_maximum_plus_dsrgemm_tn_t_8x32x8_8x16x1_2x2_4x8_1x2(b using WarpShape = cutlass::gemm::GemmShape<8, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -279,9 +279,9 @@ static void BM_SM50_device_maximum_plus_dsrgemm_tn_t_8x64x8_8x32x1_2x4_4x8_1x2(b using WarpShape = cutlass::gemm::GemmShape<8, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = 
typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -329,9 +329,9 @@ static void BM_SM50_device_maximum_plus_dsrgemm_tn_t_16x32x8_16x16x1_4x2_4x8_1x2 using WarpShape = cutlass::gemm::GemmShape<16, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -379,9 +379,9 @@ static void BM_SM50_device_maximum_plus_dsrgemm_tn_t_16x64x8_16x32x1_4x4_4x8_1x2 using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -429,9 +429,9 @@ static void BM_SM50_device_maximum_plus_dsrgemm_tn_t_16x128x8_16x64x1_4x8_4x8_1x using WarpShape = cutlass::gemm::GemmShape<16, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, 
precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -479,9 +479,9 @@ static void BM_SM50_device_maximum_plus_dsrgemm_tn_t_32x32x8_32x16x1_4x4_8x4_1x2 using WarpShape = cutlass::gemm::GemmShape<32, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -529,9 +529,9 @@ static void BM_SM50_device_maximum_plus_dsrgemm_tn_t_32x64x8_32x32x1_8x4_4x8_1x2 using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -579,9 +579,9 @@ static void BM_SM50_device_maximum_plus_dsrgemm_tn_t_32x32x8_16x32x1_4x4_4x8_2x1 using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, 
SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -629,9 +629,9 @@ static void BM_SM50_device_maximum_plus_dsrgemm_tn_t_64x32x8_32x32x1_8x4_4x8_2x1 using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -679,9 +679,9 @@ static void BM_SM50_device_maximum_plus_dsrgemm_tn_t_16x32x8_8x16x1_2x2_4x8_2x2( using WarpShape = cutlass::gemm::GemmShape<8, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -729,9 +729,9 @@ static void BM_SM50_device_maximum_plus_dsrgemm_tn_t_16x64x8_8x32x1_2x4_4x8_2x2( using WarpShape = cutlass::gemm::GemmShape<8, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename 
cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -779,9 +779,9 @@ static void BM_SM50_device_maximum_plus_dsrgemm_tn_t_32x32x8_16x16x1_4x2_4x8_2x2 using WarpShape = cutlass::gemm::GemmShape<16, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -829,9 +829,9 @@ static void BM_SM50_device_maximum_plus_dsrgemm_tn_t_32x64x8_16x32x1_4x4_4x8_2x2 using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -879,9 +879,9 @@ static void BM_SM50_device_maximum_plus_dsrgemm_tn_t_32x128x8_16x64x1_4x8_4x8_2x using WarpShape = cutlass::gemm::GemmShape<16, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, 
precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -929,9 +929,9 @@ static void BM_SM50_device_maximum_plus_dsrgemm_tn_t_64x32x8_32x16x1_4x4_8x4_2x2 using WarpShape = cutlass::gemm::GemmShape<32, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -979,9 +979,9 @@ static void BM_SM50_device_maximum_plus_dsrgemm_tn_t_64x64x8_32x32x1_8x4_4x8_2x2 using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1029,9 +1029,9 @@ static void BM_SM50_device_maximum_plus_dsrgemm_tn_t_128x32x8_64x16x1_8x4_8x4_2x using WarpShape = cutlass::gemm::GemmShape<64, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; 
using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1079,9 +1079,9 @@ static void BM_SM50_device_maximum_plus_dsrgemm_tn_t_16x64x16_8x16x1_2x2_4x8_2x4 using WarpShape = cutlass::gemm::GemmShape<8, 16, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1129,9 +1129,9 @@ static void BM_SM50_device_maximum_plus_dsrgemm_tn_t_16x128x16_8x32x1_2x4_4x8_2x using WarpShape = cutlass::gemm::GemmShape<8, 32, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1179,9 +1179,9 @@ static void BM_SM50_device_maximum_plus_dsrgemm_tn_t_32x32x8_16x8x1_2x2_8x4_2x4( using WarpShape = cutlass::gemm::GemmShape<16, 8, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = 
Config::MultiplicationOp; @@ -1229,9 +1229,9 @@ static void BM_SM50_device_maximum_plus_dsrgemm_tn_t_32x64x8_16x16x1_4x2_4x8_2x4 using WarpShape = cutlass::gemm::GemmShape<16, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1279,9 +1279,9 @@ static void BM_SM50_device_maximum_plus_dsrgemm_tn_t_32x128x8_16x32x1_4x4_4x8_2x using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1329,9 +1329,9 @@ static void BM_SM50_device_maximum_plus_dsrgemm_tn_t_64x64x8_32x16x1_4x4_8x4_2x4 using WarpShape = cutlass::gemm::GemmShape<32, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1379,9 +1379,9 @@ static void 
BM_SM50_device_maximum_plus_dsrgemm_tn_t_32x32x8_8x16x1_2x2_4x8_4x2( using WarpShape = cutlass::gemm::GemmShape<8, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1429,9 +1429,9 @@ static void BM_SM50_device_maximum_plus_dsrgemm_tn_t_64x32x8_16x16x1_4x2_4x8_4x2 using WarpShape = cutlass::gemm::GemmShape<16, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1479,9 +1479,9 @@ static void BM_SM50_device_maximum_plus_dsrgemm_tn_t_64x64x8_16x32x1_4x4_4x8_4x2 using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1529,9 +1529,9 @@ static void BM_SM50_device_maximum_plus_dsrgemm_tn_t_128x32x8_32x16x1_4x4_8x4_4x 
using WarpShape = cutlass::gemm::GemmShape<32, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1579,9 +1579,9 @@ static void BM_SM50_device_maximum_plus_dsrgemm_tn_t_32x64x16_8x16x1_2x2_4x8_4x4 using WarpShape = cutlass::gemm::GemmShape<8, 16, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1629,9 +1629,9 @@ static void BM_SM50_device_maximum_plus_dsrgemm_tn_t_32x128x16_8x32x1_2x4_4x8_4x using WarpShape = cutlass::gemm::GemmShape<8, 32, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1679,9 +1679,9 @@ static void BM_SM50_device_maximum_plus_dsrgemm_tn_t_64x32x16_16x8x1_2x2_8x4_4x4 using WarpShape = cutlass::gemm::GemmShape<16, 8, 16>; using 
InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1729,9 +1729,9 @@ static void BM_SM50_device_maximum_plus_dsrgemm_tn_t_64x64x8_16x16x1_4x2_4x8_4x4 using WarpShape = cutlass::gemm::GemmShape<16, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1779,9 +1779,9 @@ static void BM_SM50_device_maximum_plus_dsrgemm_tn_t_128x32x16_32x8x1_4x2_8x4_4x using WarpShape = cutlass::gemm::GemmShape<32, 8, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; diff --git a/bench/device/sm50_simt_maximum_plus_dsrgemm_tt_n.cu b/bench/device/sm50_simt_maximum_plus_dsrgemm_tt_n.cu index 7ccb50d..4ba3940 100644 --- a/bench/device/sm50_simt_maximum_plus_dsrgemm_tt_n.cu +++ 
b/bench/device/sm50_simt_maximum_plus_dsrgemm_tt_n.cu @@ -29,9 +29,9 @@ static void BM_SM50_device_maximum_plus_dsrgemm_tt_n_8x32x8_8x32x1_2x4_4x8_1x1(b using WarpShape = cutlass::gemm::GemmShape<8, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -79,9 +79,9 @@ static void BM_SM50_device_maximum_plus_dsrgemm_tt_n_16x32x8_16x32x1_4x4_4x8_1x1 using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -129,9 +129,9 @@ static void BM_SM50_device_maximum_plus_dsrgemm_tt_n_16x64x8_16x64x1_4x8_4x8_1x1 using WarpShape = cutlass::gemm::GemmShape<16, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -179,9 +179,9 @@ static 
void BM_SM50_device_maximum_plus_dsrgemm_tt_n_32x32x8_32x32x1_8x4_4x8_1x1 using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -229,9 +229,9 @@ static void BM_SM50_device_maximum_plus_dsrgemm_tt_n_8x32x8_8x16x1_2x2_4x8_1x2(b using WarpShape = cutlass::gemm::GemmShape<8, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -279,9 +279,9 @@ static void BM_SM50_device_maximum_plus_dsrgemm_tt_n_8x64x8_8x32x1_2x4_4x8_1x2(b using WarpShape = cutlass::gemm::GemmShape<8, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -329,9 +329,9 @@ static void BM_SM50_device_maximum_plus_dsrgemm_tt_n_16x32x8_16x16x1_4x2_4x8_1x2 
using WarpShape = cutlass::gemm::GemmShape<16, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -379,9 +379,9 @@ static void BM_SM50_device_maximum_plus_dsrgemm_tt_n_16x64x8_16x32x1_4x4_4x8_1x2 using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -429,9 +429,9 @@ static void BM_SM50_device_maximum_plus_dsrgemm_tt_n_16x128x8_16x64x1_4x8_4x8_1x using WarpShape = cutlass::gemm::GemmShape<16, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -479,9 +479,9 @@ static void BM_SM50_device_maximum_plus_dsrgemm_tt_n_32x32x8_32x16x1_4x4_8x4_1x2 using WarpShape = cutlass::gemm::GemmShape<32, 16, 8>; using 
InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -529,9 +529,9 @@ static void BM_SM50_device_maximum_plus_dsrgemm_tt_n_32x64x8_32x32x1_8x4_4x8_1x2 using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -579,9 +579,9 @@ static void BM_SM50_device_maximum_plus_dsrgemm_tt_n_32x32x8_16x32x1_4x4_4x8_2x1 using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -629,9 +629,9 @@ static void BM_SM50_device_maximum_plus_dsrgemm_tt_n_64x32x8_32x32x1_8x4_4x8_2x1 using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = 
typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -679,9 +679,9 @@ static void BM_SM50_device_maximum_plus_dsrgemm_tt_n_16x32x8_8x16x1_2x2_4x8_2x2( using WarpShape = cutlass::gemm::GemmShape<8, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -729,9 +729,9 @@ static void BM_SM50_device_maximum_plus_dsrgemm_tt_n_16x64x8_8x32x1_2x4_4x8_2x2( using WarpShape = cutlass::gemm::GemmShape<8, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -779,9 +779,9 @@ static void BM_SM50_device_maximum_plus_dsrgemm_tt_n_32x32x8_16x16x1_4x2_4x8_2x2 using WarpShape = cutlass::gemm::GemmShape<16, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, 
precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -829,9 +829,9 @@ static void BM_SM50_device_maximum_plus_dsrgemm_tt_n_32x64x8_16x32x1_4x4_4x8_2x2 using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -879,9 +879,9 @@ static void BM_SM50_device_maximum_plus_dsrgemm_tt_n_32x128x8_16x64x1_4x8_4x8_2x using WarpShape = cutlass::gemm::GemmShape<16, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -929,9 +929,9 @@ static void BM_SM50_device_maximum_plus_dsrgemm_tt_n_64x32x8_32x16x1_4x4_8x4_2x2 using WarpShape = cutlass::gemm::GemmShape<32, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, 
SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -979,9 +979,9 @@ static void BM_SM50_device_maximum_plus_dsrgemm_tt_n_64x64x8_32x32x1_8x4_4x8_2x2 using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1029,9 +1029,9 @@ static void BM_SM50_device_maximum_plus_dsrgemm_tt_n_128x32x8_64x16x1_8x4_8x4_2x using WarpShape = cutlass::gemm::GemmShape<64, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1079,9 +1079,9 @@ static void BM_SM50_device_maximum_plus_dsrgemm_tt_n_16x64x16_8x16x1_2x2_4x8_2x4 using WarpShape = cutlass::gemm::GemmShape<8, 16, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename 
cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1129,9 +1129,9 @@ static void BM_SM50_device_maximum_plus_dsrgemm_tt_n_16x128x16_8x32x1_2x4_4x8_2x using WarpShape = cutlass::gemm::GemmShape<8, 32, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1179,9 +1179,9 @@ static void BM_SM50_device_maximum_plus_dsrgemm_tt_n_32x32x8_16x8x1_2x2_8x4_2x4( using WarpShape = cutlass::gemm::GemmShape<16, 8, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1229,9 +1229,9 @@ static void BM_SM50_device_maximum_plus_dsrgemm_tt_n_32x64x8_16x16x1_4x2_4x8_2x4 using WarpShape = cutlass::gemm::GemmShape<16, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, 
precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1279,9 +1279,9 @@ static void BM_SM50_device_maximum_plus_dsrgemm_tt_n_32x128x8_16x32x1_4x4_4x8_2x using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1329,9 +1329,9 @@ static void BM_SM50_device_maximum_plus_dsrgemm_tt_n_64x64x8_32x16x1_4x4_8x4_2x4 using WarpShape = cutlass::gemm::GemmShape<32, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1379,9 +1379,9 @@ static void BM_SM50_device_maximum_plus_dsrgemm_tt_n_32x32x8_8x16x1_2x2_4x8_4x2( using WarpShape = cutlass::gemm::GemmShape<8, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, 
OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1429,9 +1429,9 @@ static void BM_SM50_device_maximum_plus_dsrgemm_tt_n_64x32x8_16x16x1_4x2_4x8_4x2 using WarpShape = cutlass::gemm::GemmShape<16, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1479,9 +1479,9 @@ static void BM_SM50_device_maximum_plus_dsrgemm_tt_n_64x64x8_16x32x1_4x4_4x8_4x2 using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1529,9 +1529,9 @@ static void BM_SM50_device_maximum_plus_dsrgemm_tt_n_128x32x8_32x16x1_4x4_8x4_4x using WarpShape = cutlass::gemm::GemmShape<32, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = 
Config::MultiplicationOp; @@ -1579,9 +1579,9 @@ static void BM_SM50_device_maximum_plus_dsrgemm_tt_n_32x64x16_8x16x1_2x2_4x8_4x4 using WarpShape = cutlass::gemm::GemmShape<8, 16, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1629,9 +1629,9 @@ static void BM_SM50_device_maximum_plus_dsrgemm_tt_n_32x128x16_8x32x1_2x4_4x8_4x using WarpShape = cutlass::gemm::GemmShape<8, 32, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1679,9 +1679,9 @@ static void BM_SM50_device_maximum_plus_dsrgemm_tt_n_64x32x16_16x8x1_2x2_8x4_4x4 using WarpShape = cutlass::gemm::GemmShape<16, 8, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1729,9 +1729,9 @@ static void 
BM_SM50_device_maximum_plus_dsrgemm_tt_n_64x64x8_16x16x1_4x2_4x8_4x4 using WarpShape = cutlass::gemm::GemmShape<16, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1779,9 +1779,9 @@ static void BM_SM50_device_maximum_plus_dsrgemm_tt_n_128x32x16_32x8x1_4x2_8x4_4x using WarpShape = cutlass::gemm::GemmShape<32, 8, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; diff --git a/bench/device/sm50_simt_maximum_plus_dsrgemm_tt_t.cu b/bench/device/sm50_simt_maximum_plus_dsrgemm_tt_t.cu index 120e463..ddaaf9a 100644 --- a/bench/device/sm50_simt_maximum_plus_dsrgemm_tt_t.cu +++ b/bench/device/sm50_simt_maximum_plus_dsrgemm_tt_t.cu @@ -29,9 +29,9 @@ static void BM_SM50_device_maximum_plus_dsrgemm_tt_t_8x32x8_8x32x1_2x4_4x8_1x1(b using WarpShape = cutlass::gemm::GemmShape<8, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, 
precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -79,9 +79,9 @@ static void BM_SM50_device_maximum_plus_dsrgemm_tt_t_16x32x8_16x32x1_4x4_4x8_1x1 using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -129,9 +129,9 @@ static void BM_SM50_device_maximum_plus_dsrgemm_tt_t_16x64x8_16x64x1_4x8_4x8_1x1 using WarpShape = cutlass::gemm::GemmShape<16, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -179,9 +179,9 @@ static void BM_SM50_device_maximum_plus_dsrgemm_tt_t_32x32x8_32x32x1_8x4_4x8_1x1 using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, 
SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -229,9 +229,9 @@ static void BM_SM50_device_maximum_plus_dsrgemm_tt_t_8x32x8_8x16x1_2x2_4x8_1x2(b using WarpShape = cutlass::gemm::GemmShape<8, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -279,9 +279,9 @@ static void BM_SM50_device_maximum_plus_dsrgemm_tt_t_8x64x8_8x32x1_2x4_4x8_1x2(b using WarpShape = cutlass::gemm::GemmShape<8, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -329,9 +329,9 @@ static void BM_SM50_device_maximum_plus_dsrgemm_tt_t_16x32x8_16x16x1_4x2_4x8_1x2 using WarpShape = cutlass::gemm::GemmShape<16, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = 
Config::MultiplicationOp; @@ -379,9 +379,9 @@ static void BM_SM50_device_maximum_plus_dsrgemm_tt_t_16x64x8_16x32x1_4x4_4x8_1x2 using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -429,9 +429,9 @@ static void BM_SM50_device_maximum_plus_dsrgemm_tt_t_16x128x8_16x64x1_4x8_4x8_1x using WarpShape = cutlass::gemm::GemmShape<16, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -479,9 +479,9 @@ static void BM_SM50_device_maximum_plus_dsrgemm_tt_t_32x32x8_32x16x1_4x4_8x4_1x2 using WarpShape = cutlass::gemm::GemmShape<32, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -529,9 +529,9 @@ static void 
BM_SM50_device_maximum_plus_dsrgemm_tt_t_32x64x8_32x32x1_8x4_4x8_1x2 using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -579,9 +579,9 @@ static void BM_SM50_device_maximum_plus_dsrgemm_tt_t_32x32x8_16x32x1_4x4_4x8_2x1 using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -629,9 +629,9 @@ static void BM_SM50_device_maximum_plus_dsrgemm_tt_t_64x32x8_32x32x1_8x4_4x8_2x1 using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -679,9 +679,9 @@ static void BM_SM50_device_maximum_plus_dsrgemm_tt_t_16x32x8_8x16x1_2x2_4x8_2x2( using 
WarpShape = cutlass::gemm::GemmShape<8, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -729,9 +729,9 @@ static void BM_SM50_device_maximum_plus_dsrgemm_tt_t_16x64x8_8x32x1_2x4_4x8_2x2( using WarpShape = cutlass::gemm::GemmShape<8, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -779,9 +779,9 @@ static void BM_SM50_device_maximum_plus_dsrgemm_tt_t_32x32x8_16x16x1_4x2_4x8_2x2 using WarpShape = cutlass::gemm::GemmShape<16, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -829,9 +829,9 @@ static void BM_SM50_device_maximum_plus_dsrgemm_tt_t_32x64x8_16x32x1_4x4_4x8_2x2 using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = 
cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -879,9 +879,9 @@ static void BM_SM50_device_maximum_plus_dsrgemm_tt_t_32x128x8_16x64x1_4x8_4x8_2x using WarpShape = cutlass::gemm::GemmShape<16, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -929,9 +929,9 @@ static void BM_SM50_device_maximum_plus_dsrgemm_tt_t_64x32x8_32x16x1_4x4_8x4_2x2 using WarpShape = cutlass::gemm::GemmShape<32, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -979,9 +979,9 @@ static void BM_SM50_device_maximum_plus_dsrgemm_tt_t_64x64x8_32x32x1_8x4_4x8_2x2 using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename 
cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1029,9 +1029,9 @@ static void BM_SM50_device_maximum_plus_dsrgemm_tt_t_128x32x8_64x16x1_8x4_8x4_2x using WarpShape = cutlass::gemm::GemmShape<64, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1079,9 +1079,9 @@ static void BM_SM50_device_maximum_plus_dsrgemm_tt_t_16x64x16_8x16x1_2x2_4x8_2x4 using WarpShape = cutlass::gemm::GemmShape<8, 16, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1129,9 +1129,9 @@ static void BM_SM50_device_maximum_plus_dsrgemm_tt_t_16x128x16_8x32x1_2x4_4x8_2x using WarpShape = cutlass::gemm::GemmShape<8, 32, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, 
precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1179,9 +1179,9 @@ static void BM_SM50_device_maximum_plus_dsrgemm_tt_t_32x32x8_16x8x1_2x2_8x4_2x4( using WarpShape = cutlass::gemm::GemmShape<16, 8, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1229,9 +1229,9 @@ static void BM_SM50_device_maximum_plus_dsrgemm_tt_t_32x64x8_16x16x1_4x2_4x8_2x4 using WarpShape = cutlass::gemm::GemmShape<16, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1279,9 +1279,9 @@ static void BM_SM50_device_maximum_plus_dsrgemm_tt_t_32x128x8_16x32x1_4x4_4x8_2x using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, 
cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1329,9 +1329,9 @@ static void BM_SM50_device_maximum_plus_dsrgemm_tt_t_64x64x8_32x16x1_4x4_8x4_2x4 using WarpShape = cutlass::gemm::GemmShape<32, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1379,9 +1379,9 @@ static void BM_SM50_device_maximum_plus_dsrgemm_tt_t_32x32x8_8x16x1_2x2_4x8_4x2( using WarpShape = cutlass::gemm::GemmShape<8, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1429,9 +1429,9 @@ static void BM_SM50_device_maximum_plus_dsrgemm_tt_t_64x32x8_16x16x1_4x2_4x8_4x2 using WarpShape = cutlass::gemm::GemmShape<16, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename 
cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1479,9 +1479,9 @@ static void BM_SM50_device_maximum_plus_dsrgemm_tt_t_64x64x8_16x32x1_4x4_4x8_4x2 using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1529,9 +1529,9 @@ static void BM_SM50_device_maximum_plus_dsrgemm_tt_t_128x32x8_32x16x1_4x4_8x4_4x using WarpShape = cutlass::gemm::GemmShape<32, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1579,9 +1579,9 @@ static void BM_SM50_device_maximum_plus_dsrgemm_tt_t_32x64x16_8x16x1_2x2_4x8_4x4 using WarpShape = cutlass::gemm::GemmShape<8, 16, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, 
precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1629,9 +1629,9 @@ static void BM_SM50_device_maximum_plus_dsrgemm_tt_t_32x128x16_8x32x1_2x4_4x8_4x using WarpShape = cutlass::gemm::GemmShape<8, 32, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1679,9 +1679,9 @@ static void BM_SM50_device_maximum_plus_dsrgemm_tt_t_64x32x16_16x8x1_2x2_8x4_4x4 using WarpShape = cutlass::gemm::GemmShape<16, 8, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1729,9 +1729,9 @@ static void BM_SM50_device_maximum_plus_dsrgemm_tt_t_64x64x8_16x16x1_4x2_4x8_4x4 using WarpShape = cutlass::gemm::GemmShape<16, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, 
OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1779,9 +1779,9 @@ static void BM_SM50_device_maximum_plus_dsrgemm_tt_t_128x32x16_32x8x1_4x2_8x4_4x using WarpShape = cutlass::gemm::GemmShape<32, 8, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; diff --git a/bench/device/sm50_simt_maximum_plus_ssrgemm_nn_n.cu b/bench/device/sm50_simt_maximum_plus_ssrgemm_nn_n.cu index 38f0663..8c6a834 100644 --- a/bench/device/sm50_simt_maximum_plus_ssrgemm_nn_n.cu +++ b/bench/device/sm50_simt_maximum_plus_ssrgemm_nn_n.cu @@ -29,9 +29,9 @@ static void BM_SM50_device_maximum_plus_ssrgemm_nn_n_8x32x8_8x32x1_2x4_4x8_1x1(b using WarpShape = cutlass::gemm::GemmShape<8, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -79,9 +79,9 @@ static void BM_SM50_device_maximum_plus_ssrgemm_nn_n_16x32x8_16x32x1_4x4_4x8_1x1 using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - 
cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -129,9 +129,9 @@ static void BM_SM50_device_maximum_plus_ssrgemm_nn_n_16x64x8_16x64x1_4x8_4x8_1x1 using WarpShape = cutlass::gemm::GemmShape<16, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -179,9 +179,9 @@ static void BM_SM50_device_maximum_plus_ssrgemm_nn_n_32x32x8_32x32x1_8x4_4x8_1x1 using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -229,9 +229,9 @@ static void BM_SM50_device_maximum_plus_ssrgemm_nn_n_32x64x8_32x64x1_8x8_4x8_1x1 using WarpShape = cutlass::gemm::GemmShape<32, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename 
cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -279,9 +279,9 @@ static void BM_SM50_device_maximum_plus_ssrgemm_nn_n_64x32x8_64x32x1_8x8_8x4_1x1 using WarpShape = cutlass::gemm::GemmShape<64, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -329,9 +329,9 @@ static void BM_SM50_device_maximum_plus_ssrgemm_nn_n_8x32x8_8x16x1_2x2_4x8_1x2(b using WarpShape = cutlass::gemm::GemmShape<8, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -379,9 +379,9 @@ static void BM_SM50_device_maximum_plus_ssrgemm_nn_n_8x64x8_8x32x1_2x4_4x8_1x2(b using WarpShape = cutlass::gemm::GemmShape<8, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, 
precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -429,9 +429,9 @@ static void BM_SM50_device_maximum_plus_ssrgemm_nn_n_16x32x8_16x16x1_4x2_4x8_1x2 using WarpShape = cutlass::gemm::GemmShape<16, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -479,9 +479,9 @@ static void BM_SM50_device_maximum_plus_ssrgemm_nn_n_16x64x8_16x32x1_4x4_4x8_1x2 using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -529,9 +529,9 @@ static void BM_SM50_device_maximum_plus_ssrgemm_nn_n_16x128x8_16x64x1_4x8_4x8_1x using WarpShape = cutlass::gemm::GemmShape<16, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using 
AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -579,9 +579,9 @@ static void BM_SM50_device_maximum_plus_ssrgemm_nn_n_32x32x8_32x16x1_4x4_8x4_1x2 using WarpShape = cutlass::gemm::GemmShape<32, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -629,9 +629,9 @@ static void BM_SM50_device_maximum_plus_ssrgemm_nn_n_32x64x8_32x32x1_8x4_4x8_1x2 using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -679,9 +679,9 @@ static void BM_SM50_device_maximum_plus_ssrgemm_nn_n_32x128x8_32x64x1_8x8_4x8_1x using WarpShape = cutlass::gemm::GemmShape<32, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ 
-729,9 +729,9 @@ static void BM_SM50_device_maximum_plus_ssrgemm_nn_n_64x64x8_64x32x1_8x8_8x4_1x2 using WarpShape = cutlass::gemm::GemmShape<64, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -779,9 +779,9 @@ static void BM_SM50_device_maximum_plus_ssrgemm_nn_n_32x32x8_16x32x1_4x4_4x8_2x1 using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -829,9 +829,9 @@ static void BM_SM50_device_maximum_plus_ssrgemm_nn_n_64x32x8_32x32x1_8x4_4x8_2x1 using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -879,9 +879,9 @@ static void 
BM_SM50_device_maximum_plus_ssrgemm_nn_n_64x64x8_32x64x1_8x8_4x8_2x1 using WarpShape = cutlass::gemm::GemmShape<32, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -929,9 +929,9 @@ static void BM_SM50_device_maximum_plus_ssrgemm_nn_n_128x32x8_64x32x1_8x8_8x4_2x using WarpShape = cutlass::gemm::GemmShape<64, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -979,9 +979,9 @@ static void BM_SM50_device_maximum_plus_ssrgemm_nn_n_16x32x8_8x16x1_2x2_4x8_2x2( using WarpShape = cutlass::gemm::GemmShape<8, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1029,9 +1029,9 @@ static void BM_SM50_device_maximum_plus_ssrgemm_nn_n_16x64x8_8x32x1_2x4_4x8_2x2( using 
WarpShape = cutlass::gemm::GemmShape<8, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1079,9 +1079,9 @@ static void BM_SM50_device_maximum_plus_ssrgemm_nn_n_32x32x8_16x16x1_4x2_4x8_2x2 using WarpShape = cutlass::gemm::GemmShape<16, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1129,9 +1129,9 @@ static void BM_SM50_device_maximum_plus_ssrgemm_nn_n_32x64x8_16x32x1_4x4_4x8_2x2 using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1179,9 +1179,9 @@ static void BM_SM50_device_maximum_plus_ssrgemm_nn_n_32x128x8_16x64x1_4x8_4x8_2x using WarpShape = cutlass::gemm::GemmShape<16, 64, 8>; using InstructionShape 
= cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1229,9 +1229,9 @@ static void BM_SM50_device_maximum_plus_ssrgemm_nn_n_64x32x8_32x16x1_4x4_8x4_2x2 using WarpShape = cutlass::gemm::GemmShape<32, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1279,9 +1279,9 @@ static void BM_SM50_device_maximum_plus_ssrgemm_nn_n_64x64x8_32x32x1_8x4_4x8_2x2 using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1329,9 +1329,9 @@ static void BM_SM50_device_maximum_plus_ssrgemm_nn_n_64x128x8_32x64x1_8x8_4x8_2x using WarpShape = cutlass::gemm::GemmShape<32, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename 
cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1379,9 +1379,9 @@ static void BM_SM50_device_maximum_plus_ssrgemm_nn_n_128x32x8_64x16x1_8x4_8x4_2x using WarpShape = cutlass::gemm::GemmShape<64, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1429,9 +1429,9 @@ static void BM_SM50_device_maximum_plus_ssrgemm_nn_n_128x64x8_64x32x1_8x8_8x4_2x using WarpShape = cutlass::gemm::GemmShape<64, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1479,9 +1479,9 @@ static void BM_SM50_device_maximum_plus_ssrgemm_nn_n_16x64x16_8x16x1_2x2_4x8_2x4 using WarpShape = cutlass::gemm::GemmShape<8, 16, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, 
precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1529,9 +1529,9 @@ static void BM_SM50_device_maximum_plus_ssrgemm_nn_n_16x128x16_8x32x1_2x4_4x8_2x using WarpShape = cutlass::gemm::GemmShape<8, 32, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1579,9 +1579,9 @@ static void BM_SM50_device_maximum_plus_ssrgemm_nn_n_32x32x8_16x8x1_2x2_8x4_2x4( using WarpShape = cutlass::gemm::GemmShape<16, 8, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1629,9 +1629,9 @@ static void BM_SM50_device_maximum_plus_ssrgemm_nn_n_32x64x8_16x16x1_4x2_4x8_2x4 using WarpShape = cutlass::gemm::GemmShape<16, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, 
cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1679,9 +1679,9 @@ static void BM_SM50_device_maximum_plus_ssrgemm_nn_n_32x128x8_16x32x1_4x4_4x8_2x using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1729,9 +1729,9 @@ static void BM_SM50_device_maximum_plus_ssrgemm_nn_n_32x256x8_16x64x1_4x8_4x8_2x using WarpShape = cutlass::gemm::GemmShape<16, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1779,9 +1779,9 @@ static void BM_SM50_device_maximum_plus_ssrgemm_nn_n_64x64x8_32x16x1_4x4_8x4_2x4 using WarpShape = cutlass::gemm::GemmShape<32, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename 
cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1829,9 +1829,9 @@ static void BM_SM50_device_maximum_plus_ssrgemm_nn_n_64x128x8_32x32x1_8x4_4x8_2x using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1879,9 +1879,9 @@ static void BM_SM50_device_maximum_plus_ssrgemm_nn_n_64x256x8_32x64x1_8x8_4x8_2x using WarpShape = cutlass::gemm::GemmShape<32, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1929,9 +1929,9 @@ static void BM_SM50_device_maximum_plus_ssrgemm_nn_n_128x128x8_64x32x1_8x8_8x4_2 using WarpShape = cutlass::gemm::GemmShape<64, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, 
precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1979,9 +1979,9 @@ static void BM_SM50_device_maximum_plus_ssrgemm_nn_n_32x32x8_8x16x1_2x2_4x8_4x2( using WarpShape = cutlass::gemm::GemmShape<8, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -2029,9 +2029,9 @@ static void BM_SM50_device_maximum_plus_ssrgemm_nn_n_64x32x8_16x16x1_4x2_4x8_4x2 using WarpShape = cutlass::gemm::GemmShape<16, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -2079,9 +2079,9 @@ static void BM_SM50_device_maximum_plus_ssrgemm_nn_n_64x64x8_16x32x1_4x4_4x8_4x2 using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, 
OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -2129,9 +2129,9 @@ static void BM_SM50_device_maximum_plus_ssrgemm_nn_n_128x32x8_32x16x1_4x4_8x4_4x using WarpShape = cutlass::gemm::GemmShape<32, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -2179,9 +2179,9 @@ static void BM_SM50_device_maximum_plus_ssrgemm_nn_n_128x64x8_32x32x1_8x4_4x8_4x using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -2229,9 +2229,9 @@ static void BM_SM50_device_maximum_plus_ssrgemm_nn_n_128x128x8_32x64x1_8x8_4x8_4 using WarpShape = cutlass::gemm::GemmShape<32, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = 
Config::MultiplicationOp; @@ -2279,9 +2279,9 @@ static void BM_SM50_device_maximum_plus_ssrgemm_nn_n_256x32x8_64x16x1_8x4_8x4_4x using WarpShape = cutlass::gemm::GemmShape<64, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -2329,9 +2329,9 @@ static void BM_SM50_device_maximum_plus_ssrgemm_nn_n_256x64x8_64x32x1_8x8_8x4_4x using WarpShape = cutlass::gemm::GemmShape<64, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -2379,9 +2379,9 @@ static void BM_SM50_device_maximum_plus_ssrgemm_nn_n_32x64x16_8x16x1_2x2_4x8_4x4 using WarpShape = cutlass::gemm::GemmShape<8, 16, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -2429,9 +2429,9 @@ static void 
BM_SM50_device_maximum_plus_ssrgemm_nn_n_32x128x16_8x32x1_2x4_4x8_4x using WarpShape = cutlass::gemm::GemmShape<8, 32, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -2479,9 +2479,9 @@ static void BM_SM50_device_maximum_plus_ssrgemm_nn_n_64x32x16_16x8x1_2x2_8x4_4x4 using WarpShape = cutlass::gemm::GemmShape<16, 8, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -2529,9 +2529,9 @@ static void BM_SM50_device_maximum_plus_ssrgemm_nn_n_64x64x8_16x16x1_4x2_4x8_4x4 using WarpShape = cutlass::gemm::GemmShape<16, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -2579,9 +2579,9 @@ static void BM_SM50_device_maximum_plus_ssrgemm_nn_n_64x128x8_16x32x1_4x4_4x8_4x 
using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -2629,9 +2629,9 @@ static void BM_SM50_device_maximum_plus_ssrgemm_nn_n_64x256x8_16x64x1_4x8_4x8_4x using WarpShape = cutlass::gemm::GemmShape<16, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -2679,9 +2679,9 @@ static void BM_SM50_device_maximum_plus_ssrgemm_nn_n_128x32x16_32x8x1_4x2_8x4_4x using WarpShape = cutlass::gemm::GemmShape<32, 8, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -2729,9 +2729,9 @@ static void BM_SM50_device_maximum_plus_ssrgemm_nn_n_128x64x8_32x16x1_4x4_8x4_4x using WarpShape = cutlass::gemm::GemmShape<32, 16, 8>; using 
InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -2779,9 +2779,9 @@ static void BM_SM50_device_maximum_plus_ssrgemm_nn_n_128x128x8_32x32x1_8x4_4x8_4 using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -2829,9 +2829,9 @@ static void BM_SM50_device_maximum_plus_ssrgemm_nn_n_256x64x8_64x16x1_8x4_8x4_4x using WarpShape = cutlass::gemm::GemmShape<64, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; diff --git a/bench/device/sm50_simt_maximum_plus_ssrgemm_nn_t.cu b/bench/device/sm50_simt_maximum_plus_ssrgemm_nn_t.cu index 63bbfac..a3c60ca 100644 --- a/bench/device/sm50_simt_maximum_plus_ssrgemm_nn_t.cu +++ 
b/bench/device/sm50_simt_maximum_plus_ssrgemm_nn_t.cu @@ -29,9 +29,9 @@ static void BM_SM50_device_maximum_plus_ssrgemm_nn_t_8x32x8_8x32x1_2x4_4x8_1x1(b using WarpShape = cutlass::gemm::GemmShape<8, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -79,9 +79,9 @@ static void BM_SM50_device_maximum_plus_ssrgemm_nn_t_16x32x8_16x32x1_4x4_4x8_1x1 using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -129,9 +129,9 @@ static void BM_SM50_device_maximum_plus_ssrgemm_nn_t_16x64x8_16x64x1_4x8_4x8_1x1 using WarpShape = cutlass::gemm::GemmShape<16, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -179,9 +179,9 @@ static 
void BM_SM50_device_maximum_plus_ssrgemm_nn_t_32x32x8_32x32x1_8x4_4x8_1x1 using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -229,9 +229,9 @@ static void BM_SM50_device_maximum_plus_ssrgemm_nn_t_32x64x8_32x64x1_8x8_4x8_1x1 using WarpShape = cutlass::gemm::GemmShape<32, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -279,9 +279,9 @@ static void BM_SM50_device_maximum_plus_ssrgemm_nn_t_64x32x8_64x32x1_8x8_8x4_1x1 using WarpShape = cutlass::gemm::GemmShape<64, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -329,9 +329,9 @@ static void BM_SM50_device_maximum_plus_ssrgemm_nn_t_8x32x8_8x16x1_2x2_4x8_1x2(b 
using WarpShape = cutlass::gemm::GemmShape<8, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -379,9 +379,9 @@ static void BM_SM50_device_maximum_plus_ssrgemm_nn_t_8x64x8_8x32x1_2x4_4x8_1x2(b using WarpShape = cutlass::gemm::GemmShape<8, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -429,9 +429,9 @@ static void BM_SM50_device_maximum_plus_ssrgemm_nn_t_16x32x8_16x16x1_4x2_4x8_1x2 using WarpShape = cutlass::gemm::GemmShape<16, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -479,9 +479,9 @@ static void BM_SM50_device_maximum_plus_ssrgemm_nn_t_16x64x8_16x32x1_4x4_4x8_1x2 using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape 
= cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -529,9 +529,9 @@ static void BM_SM50_device_maximum_plus_ssrgemm_nn_t_16x128x8_16x64x1_4x8_4x8_1x using WarpShape = cutlass::gemm::GemmShape<16, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -579,9 +579,9 @@ static void BM_SM50_device_maximum_plus_ssrgemm_nn_t_32x32x8_32x16x1_4x4_8x4_1x2 using WarpShape = cutlass::gemm::GemmShape<32, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -629,9 +629,9 @@ static void BM_SM50_device_maximum_plus_ssrgemm_nn_t_32x64x8_32x32x1_8x4_4x8_1x2 using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename 
cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -679,9 +679,9 @@ static void BM_SM50_device_maximum_plus_ssrgemm_nn_t_32x128x8_32x64x1_8x8_4x8_1x using WarpShape = cutlass::gemm::GemmShape<32, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -729,9 +729,9 @@ static void BM_SM50_device_maximum_plus_ssrgemm_nn_t_64x64x8_64x32x1_8x8_8x4_1x2 using WarpShape = cutlass::gemm::GemmShape<64, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -779,9 +779,9 @@ static void BM_SM50_device_maximum_plus_ssrgemm_nn_t_32x32x8_16x32x1_4x4_4x8_2x1 using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, 
precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -829,9 +829,9 @@ static void BM_SM50_device_maximum_plus_ssrgemm_nn_t_64x32x8_32x32x1_8x4_4x8_2x1 using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -879,9 +879,9 @@ static void BM_SM50_device_maximum_plus_ssrgemm_nn_t_64x64x8_32x64x1_8x8_4x8_2x1 using WarpShape = cutlass::gemm::GemmShape<32, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -929,9 +929,9 @@ static void BM_SM50_device_maximum_plus_ssrgemm_nn_t_128x32x8_64x32x1_8x8_8x4_2x using WarpShape = cutlass::gemm::GemmShape<64, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, 
SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -979,9 +979,9 @@ static void BM_SM50_device_maximum_plus_ssrgemm_nn_t_16x32x8_8x16x1_2x2_4x8_2x2( using WarpShape = cutlass::gemm::GemmShape<8, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1029,9 +1029,9 @@ static void BM_SM50_device_maximum_plus_ssrgemm_nn_t_16x64x8_8x32x1_2x4_4x8_2x2( using WarpShape = cutlass::gemm::GemmShape<8, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1079,9 +1079,9 @@ static void BM_SM50_device_maximum_plus_ssrgemm_nn_t_32x32x8_16x16x1_4x2_4x8_2x2 using WarpShape = cutlass::gemm::GemmShape<16, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename 
cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1129,9 +1129,9 @@ static void BM_SM50_device_maximum_plus_ssrgemm_nn_t_32x64x8_16x32x1_4x4_4x8_2x2 using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1179,9 +1179,9 @@ static void BM_SM50_device_maximum_plus_ssrgemm_nn_t_32x128x8_16x64x1_4x8_4x8_2x using WarpShape = cutlass::gemm::GemmShape<16, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1229,9 +1229,9 @@ static void BM_SM50_device_maximum_plus_ssrgemm_nn_t_64x32x8_32x16x1_4x4_8x4_2x2 using WarpShape = cutlass::gemm::GemmShape<32, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, 
precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1279,9 +1279,9 @@ static void BM_SM50_device_maximum_plus_ssrgemm_nn_t_64x64x8_32x32x1_8x4_4x8_2x2 using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1329,9 +1329,9 @@ static void BM_SM50_device_maximum_plus_ssrgemm_nn_t_64x128x8_32x64x1_8x8_4x8_2x using WarpShape = cutlass::gemm::GemmShape<32, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1379,9 +1379,9 @@ static void BM_SM50_device_maximum_plus_ssrgemm_nn_t_128x32x8_64x16x1_8x4_8x4_2x using WarpShape = cutlass::gemm::GemmShape<64, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, 
OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1429,9 +1429,9 @@ static void BM_SM50_device_maximum_plus_ssrgemm_nn_t_128x64x8_64x32x1_8x8_8x4_2x using WarpShape = cutlass::gemm::GemmShape<64, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1479,9 +1479,9 @@ static void BM_SM50_device_maximum_plus_ssrgemm_nn_t_16x64x16_8x16x1_2x2_4x8_2x4 using WarpShape = cutlass::gemm::GemmShape<8, 16, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1529,9 +1529,9 @@ static void BM_SM50_device_maximum_plus_ssrgemm_nn_t_16x128x16_8x32x1_2x4_4x8_2x using WarpShape = cutlass::gemm::GemmShape<8, 32, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = 
Config::MultiplicationOp; @@ -1579,9 +1579,9 @@ static void BM_SM50_device_maximum_plus_ssrgemm_nn_t_32x32x8_16x8x1_2x2_8x4_2x4( using WarpShape = cutlass::gemm::GemmShape<16, 8, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1629,9 +1629,9 @@ static void BM_SM50_device_maximum_plus_ssrgemm_nn_t_32x64x8_16x16x1_4x2_4x8_2x4 using WarpShape = cutlass::gemm::GemmShape<16, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1679,9 +1679,9 @@ static void BM_SM50_device_maximum_plus_ssrgemm_nn_t_32x128x8_16x32x1_4x4_4x8_2x using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1729,9 +1729,9 @@ static void 
BM_SM50_device_maximum_plus_ssrgemm_nn_t_32x256x8_16x64x1_4x8_4x8_2x using WarpShape = cutlass::gemm::GemmShape<16, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1779,9 +1779,9 @@ static void BM_SM50_device_maximum_plus_ssrgemm_nn_t_64x64x8_32x16x1_4x4_8x4_2x4 using WarpShape = cutlass::gemm::GemmShape<32, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1829,9 +1829,9 @@ static void BM_SM50_device_maximum_plus_ssrgemm_nn_t_64x128x8_32x32x1_8x4_4x8_2x using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1879,9 +1879,9 @@ static void BM_SM50_device_maximum_plus_ssrgemm_nn_t_64x256x8_32x64x1_8x8_4x8_2x 
using WarpShape = cutlass::gemm::GemmShape<32, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1929,9 +1929,9 @@ static void BM_SM50_device_maximum_plus_ssrgemm_nn_t_128x128x8_64x32x1_8x8_8x4_2 using WarpShape = cutlass::gemm::GemmShape<64, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1979,9 +1979,9 @@ static void BM_SM50_device_maximum_plus_ssrgemm_nn_t_32x32x8_8x16x1_2x2_4x8_4x2( using WarpShape = cutlass::gemm::GemmShape<8, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -2029,9 +2029,9 @@ static void BM_SM50_device_maximum_plus_ssrgemm_nn_t_64x32x8_16x16x1_4x2_4x8_4x2 using WarpShape = cutlass::gemm::GemmShape<16, 16, 8>; using 
InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -2079,9 +2079,9 @@ static void BM_SM50_device_maximum_plus_ssrgemm_nn_t_64x64x8_16x32x1_4x4_4x8_4x2 using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -2129,9 +2129,9 @@ static void BM_SM50_device_maximum_plus_ssrgemm_nn_t_128x32x8_32x16x1_4x4_8x4_4x using WarpShape = cutlass::gemm::GemmShape<32, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -2179,9 +2179,9 @@ static void BM_SM50_device_maximum_plus_ssrgemm_nn_t_128x64x8_32x32x1_8x4_4x8_4x using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = 
typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -2229,9 +2229,9 @@ static void BM_SM50_device_maximum_plus_ssrgemm_nn_t_128x128x8_32x64x1_8x8_4x8_4 using WarpShape = cutlass::gemm::GemmShape<32, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -2279,9 +2279,9 @@ static void BM_SM50_device_maximum_plus_ssrgemm_nn_t_256x32x8_64x16x1_8x4_8x4_4x using WarpShape = cutlass::gemm::GemmShape<64, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -2329,9 +2329,9 @@ static void BM_SM50_device_maximum_plus_ssrgemm_nn_t_256x64x8_64x32x1_8x8_8x4_4x using WarpShape = cutlass::gemm::GemmShape<64, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - 
precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -2379,9 +2379,9 @@ static void BM_SM50_device_maximum_plus_ssrgemm_nn_t_32x64x16_8x16x1_2x2_4x8_4x4 using WarpShape = cutlass::gemm::GemmShape<8, 16, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -2429,9 +2429,9 @@ static void BM_SM50_device_maximum_plus_ssrgemm_nn_t_32x128x16_8x32x1_2x4_4x8_4x using WarpShape = cutlass::gemm::GemmShape<8, 32, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -2479,9 +2479,9 @@ static void BM_SM50_device_maximum_plus_ssrgemm_nn_t_64x32x16_16x8x1_2x2_8x4_4x4 using WarpShape = cutlass::gemm::GemmShape<16, 8, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - 
cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -2529,9 +2529,9 @@ static void BM_SM50_device_maximum_plus_ssrgemm_nn_t_64x64x8_16x16x1_4x2_4x8_4x4 using WarpShape = cutlass::gemm::GemmShape<16, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -2579,9 +2579,9 @@ static void BM_SM50_device_maximum_plus_ssrgemm_nn_t_64x128x8_16x32x1_4x4_4x8_4x using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -2629,9 +2629,9 @@ static void BM_SM50_device_maximum_plus_ssrgemm_nn_t_64x256x8_16x64x1_4x8_4x8_4x using WarpShape = cutlass::gemm::GemmShape<16, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename 
cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -2679,9 +2679,9 @@ static void BM_SM50_device_maximum_plus_ssrgemm_nn_t_128x32x16_32x8x1_4x2_8x4_4x using WarpShape = cutlass::gemm::GemmShape<32, 8, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -2729,9 +2729,9 @@ static void BM_SM50_device_maximum_plus_ssrgemm_nn_t_128x64x8_32x16x1_4x4_8x4_4x using WarpShape = cutlass::gemm::GemmShape<32, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -2779,9 +2779,9 @@ static void BM_SM50_device_maximum_plus_ssrgemm_nn_t_128x128x8_32x32x1_8x4_4x8_4 using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, 
precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -2829,9 +2829,9 @@ static void BM_SM50_device_maximum_plus_ssrgemm_nn_t_256x64x8_64x16x1_8x4_8x4_4x using WarpShape = cutlass::gemm::GemmShape<64, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; diff --git a/bench/device/sm50_simt_maximum_plus_ssrgemm_nt_n.cu b/bench/device/sm50_simt_maximum_plus_ssrgemm_nt_n.cu index feb5e4c..065710e 100644 --- a/bench/device/sm50_simt_maximum_plus_ssrgemm_nt_n.cu +++ b/bench/device/sm50_simt_maximum_plus_ssrgemm_nt_n.cu @@ -29,9 +29,9 @@ static void BM_SM50_device_maximum_plus_ssrgemm_nt_n_8x32x8_8x32x1_2x4_4x8_1x1(b using WarpShape = cutlass::gemm::GemmShape<8, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -79,9 +79,9 @@ static void BM_SM50_device_maximum_plus_ssrgemm_nt_n_16x32x8_16x32x1_4x4_4x8_1x1 using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - 
precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -129,9 +129,9 @@ static void BM_SM50_device_maximum_plus_ssrgemm_nt_n_16x64x8_16x64x1_4x8_4x8_1x1 using WarpShape = cutlass::gemm::GemmShape<16, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -179,9 +179,9 @@ static void BM_SM50_device_maximum_plus_ssrgemm_nt_n_32x32x8_32x32x1_8x4_4x8_1x1 using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -229,9 +229,9 @@ static void BM_SM50_device_maximum_plus_ssrgemm_nt_n_32x64x8_32x64x1_8x8_4x8_1x1 using WarpShape = cutlass::gemm::GemmShape<32, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, 
cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -279,9 +279,9 @@ static void BM_SM50_device_maximum_plus_ssrgemm_nt_n_64x32x8_64x32x1_8x8_8x4_1x1 using WarpShape = cutlass::gemm::GemmShape<64, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -329,9 +329,9 @@ static void BM_SM50_device_maximum_plus_ssrgemm_nt_n_8x32x8_8x16x1_2x2_4x8_1x2(b using WarpShape = cutlass::gemm::GemmShape<8, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -379,9 +379,9 @@ static void BM_SM50_device_maximum_plus_ssrgemm_nt_n_8x64x8_8x32x1_2x4_4x8_1x2(b using WarpShape = cutlass::gemm::GemmShape<8, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename 
cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -429,9 +429,9 @@ static void BM_SM50_device_maximum_plus_ssrgemm_nt_n_16x32x8_16x16x1_4x2_4x8_1x2 using WarpShape = cutlass::gemm::GemmShape<16, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -479,9 +479,9 @@ static void BM_SM50_device_maximum_plus_ssrgemm_nt_n_16x64x8_16x32x1_4x4_4x8_1x2 using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -529,9 +529,9 @@ static void BM_SM50_device_maximum_plus_ssrgemm_nt_n_16x128x8_16x64x1_4x8_4x8_1x using WarpShape = cutlass::gemm::GemmShape<16, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, 
precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -579,9 +579,9 @@ static void BM_SM50_device_maximum_plus_ssrgemm_nt_n_32x32x8_32x16x1_4x4_8x4_1x2 using WarpShape = cutlass::gemm::GemmShape<32, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -629,9 +629,9 @@ static void BM_SM50_device_maximum_plus_ssrgemm_nt_n_32x64x8_32x32x1_8x4_4x8_1x2 using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -679,9 +679,9 @@ static void BM_SM50_device_maximum_plus_ssrgemm_nt_n_32x128x8_32x64x1_8x8_4x8_1x using WarpShape = cutlass::gemm::GemmShape<32, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using 
AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -729,9 +729,9 @@ static void BM_SM50_device_maximum_plus_ssrgemm_nt_n_64x64x8_64x32x1_8x8_8x4_1x2 using WarpShape = cutlass::gemm::GemmShape<64, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -779,9 +779,9 @@ static void BM_SM50_device_maximum_plus_ssrgemm_nt_n_32x32x8_16x32x1_4x4_4x8_2x1 using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -829,9 +829,9 @@ static void BM_SM50_device_maximum_plus_ssrgemm_nt_n_64x32x8_32x32x1_8x4_4x8_2x1 using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ 
-879,9 +879,9 @@ static void BM_SM50_device_maximum_plus_ssrgemm_nt_n_64x64x8_32x64x1_8x8_4x8_2x1 using WarpShape = cutlass::gemm::GemmShape<32, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -929,9 +929,9 @@ static void BM_SM50_device_maximum_plus_ssrgemm_nt_n_128x32x8_64x32x1_8x8_8x4_2x using WarpShape = cutlass::gemm::GemmShape<64, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -979,9 +979,9 @@ static void BM_SM50_device_maximum_plus_ssrgemm_nt_n_16x32x8_8x16x1_2x2_4x8_2x2( using WarpShape = cutlass::gemm::GemmShape<8, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1029,9 +1029,9 @@ static void 
BM_SM50_device_maximum_plus_ssrgemm_nt_n_16x64x8_8x32x1_2x4_4x8_2x2( using WarpShape = cutlass::gemm::GemmShape<8, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1079,9 +1079,9 @@ static void BM_SM50_device_maximum_plus_ssrgemm_nt_n_32x32x8_16x16x1_4x2_4x8_2x2 using WarpShape = cutlass::gemm::GemmShape<16, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1129,9 +1129,9 @@ static void BM_SM50_device_maximum_plus_ssrgemm_nt_n_32x64x8_16x32x1_4x4_4x8_2x2 using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1179,9 +1179,9 @@ static void BM_SM50_device_maximum_plus_ssrgemm_nt_n_32x128x8_16x64x1_4x8_4x8_2x 
using WarpShape = cutlass::gemm::GemmShape<16, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1229,9 +1229,9 @@ static void BM_SM50_device_maximum_plus_ssrgemm_nt_n_64x32x8_32x16x1_4x4_8x4_2x2 using WarpShape = cutlass::gemm::GemmShape<32, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1279,9 +1279,9 @@ static void BM_SM50_device_maximum_plus_ssrgemm_nt_n_64x64x8_32x32x1_8x4_4x8_2x2 using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1329,9 +1329,9 @@ static void BM_SM50_device_maximum_plus_ssrgemm_nt_n_64x128x8_32x64x1_8x8_4x8_2x using WarpShape = cutlass::gemm::GemmShape<32, 64, 8>; using 
InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1379,9 +1379,9 @@ static void BM_SM50_device_maximum_plus_ssrgemm_nt_n_128x32x8_64x16x1_8x4_8x4_2x using WarpShape = cutlass::gemm::GemmShape<64, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1429,9 +1429,9 @@ static void BM_SM50_device_maximum_plus_ssrgemm_nt_n_128x64x8_64x32x1_8x8_8x4_2x using WarpShape = cutlass::gemm::GemmShape<64, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1479,9 +1479,9 @@ static void BM_SM50_device_maximum_plus_ssrgemm_nt_n_16x64x16_8x16x1_2x2_4x8_2x4 using WarpShape = cutlass::gemm::GemmShape<8, 16, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = 
typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1529,9 +1529,9 @@ static void BM_SM50_device_maximum_plus_ssrgemm_nt_n_16x128x16_8x32x1_2x4_4x8_2x using WarpShape = cutlass::gemm::GemmShape<8, 32, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1579,9 +1579,9 @@ static void BM_SM50_device_maximum_plus_ssrgemm_nt_n_32x32x8_16x8x1_2x2_8x4_2x4( using WarpShape = cutlass::gemm::GemmShape<16, 8, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1629,9 +1629,9 @@ static void BM_SM50_device_maximum_plus_ssrgemm_nt_n_32x64x8_16x16x1_4x2_4x8_2x4 using WarpShape = cutlass::gemm::GemmShape<16, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - 
precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1679,9 +1679,9 @@ static void BM_SM50_device_maximum_plus_ssrgemm_nt_n_32x128x8_16x32x1_4x4_4x8_2x using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1729,9 +1729,9 @@ static void BM_SM50_device_maximum_plus_ssrgemm_nt_n_32x256x8_16x64x1_4x8_4x8_2x using WarpShape = cutlass::gemm::GemmShape<16, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1779,9 +1779,9 @@ static void BM_SM50_device_maximum_plus_ssrgemm_nt_n_64x64x8_32x16x1_4x4_8x4_2x4 using WarpShape = cutlass::gemm::GemmShape<32, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - 
cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1829,9 +1829,9 @@ static void BM_SM50_device_maximum_plus_ssrgemm_nt_n_64x128x8_32x32x1_8x4_4x8_2x using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1879,9 +1879,9 @@ static void BM_SM50_device_maximum_plus_ssrgemm_nt_n_64x256x8_32x64x1_8x8_4x8_2x using WarpShape = cutlass::gemm::GemmShape<32, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1929,9 +1929,9 @@ static void BM_SM50_device_maximum_plus_ssrgemm_nt_n_128x128x8_64x32x1_8x8_8x4_2 using WarpShape = cutlass::gemm::GemmShape<64, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename 
cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1979,9 +1979,9 @@ static void BM_SM50_device_maximum_plus_ssrgemm_nt_n_32x32x8_8x16x1_2x2_4x8_4x2( using WarpShape = cutlass::gemm::GemmShape<8, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -2029,9 +2029,9 @@ static void BM_SM50_device_maximum_plus_ssrgemm_nt_n_64x32x8_16x16x1_4x2_4x8_4x2 using WarpShape = cutlass::gemm::GemmShape<16, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -2079,9 +2079,9 @@ static void BM_SM50_device_maximum_plus_ssrgemm_nt_n_64x64x8_16x32x1_4x4_4x8_4x2 using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, 
precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -2129,9 +2129,9 @@ static void BM_SM50_device_maximum_plus_ssrgemm_nt_n_128x32x8_32x16x1_4x4_8x4_4x using WarpShape = cutlass::gemm::GemmShape<32, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -2179,9 +2179,9 @@ static void BM_SM50_device_maximum_plus_ssrgemm_nt_n_128x64x8_32x32x1_8x4_4x8_4x using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -2229,9 +2229,9 @@ static void BM_SM50_device_maximum_plus_ssrgemm_nt_n_128x128x8_32x64x1_8x8_4x8_4 using WarpShape = cutlass::gemm::GemmShape<32, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, 
OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -2279,9 +2279,9 @@ static void BM_SM50_device_maximum_plus_ssrgemm_nt_n_256x32x8_64x16x1_8x4_8x4_4x using WarpShape = cutlass::gemm::GemmShape<64, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -2329,9 +2329,9 @@ static void BM_SM50_device_maximum_plus_ssrgemm_nt_n_256x64x8_64x32x1_8x8_8x4_4x using WarpShape = cutlass::gemm::GemmShape<64, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -2379,9 +2379,9 @@ static void BM_SM50_device_maximum_plus_ssrgemm_nt_n_32x64x16_8x16x1_2x2_4x8_4x4 using WarpShape = cutlass::gemm::GemmShape<8, 16, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = 
Config::MultiplicationOp; @@ -2429,9 +2429,9 @@ static void BM_SM50_device_maximum_plus_ssrgemm_nt_n_32x128x16_8x32x1_2x4_4x8_4x using WarpShape = cutlass::gemm::GemmShape<8, 32, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -2479,9 +2479,9 @@ static void BM_SM50_device_maximum_plus_ssrgemm_nt_n_64x32x16_16x8x1_2x2_8x4_4x4 using WarpShape = cutlass::gemm::GemmShape<16, 8, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -2529,9 +2529,9 @@ static void BM_SM50_device_maximum_plus_ssrgemm_nt_n_64x64x8_16x16x1_4x2_4x8_4x4 using WarpShape = cutlass::gemm::GemmShape<16, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -2579,9 +2579,9 @@ static void 
BM_SM50_device_maximum_plus_ssrgemm_nt_n_64x128x8_16x32x1_4x4_4x8_4x using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -2629,9 +2629,9 @@ static void BM_SM50_device_maximum_plus_ssrgemm_nt_n_64x256x8_16x64x1_4x8_4x8_4x using WarpShape = cutlass::gemm::GemmShape<16, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -2679,9 +2679,9 @@ static void BM_SM50_device_maximum_plus_ssrgemm_nt_n_128x32x16_32x8x1_4x2_8x4_4x using WarpShape = cutlass::gemm::GemmShape<32, 8, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -2729,9 +2729,9 @@ static void BM_SM50_device_maximum_plus_ssrgemm_nt_n_128x64x8_32x16x1_4x4_8x4_4x 
using WarpShape = cutlass::gemm::GemmShape<32, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -2779,9 +2779,9 @@ static void BM_SM50_device_maximum_plus_ssrgemm_nt_n_128x128x8_32x32x1_8x4_4x8_4 using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -2829,9 +2829,9 @@ static void BM_SM50_device_maximum_plus_ssrgemm_nt_n_256x64x8_64x16x1_8x4_8x4_4x using WarpShape = cutlass::gemm::GemmShape<64, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; diff --git a/bench/device/sm50_simt_maximum_plus_ssrgemm_nt_t.cu b/bench/device/sm50_simt_maximum_plus_ssrgemm_nt_t.cu index d432b83..fd9bc29 100644 --- 
a/bench/device/sm50_simt_maximum_plus_ssrgemm_nt_t.cu +++ b/bench/device/sm50_simt_maximum_plus_ssrgemm_nt_t.cu @@ -29,9 +29,9 @@ static void BM_SM50_device_maximum_plus_ssrgemm_nt_t_8x32x8_8x32x1_2x4_4x8_1x1(b using WarpShape = cutlass::gemm::GemmShape<8, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -79,9 +79,9 @@ static void BM_SM50_device_maximum_plus_ssrgemm_nt_t_16x32x8_16x32x1_4x4_4x8_1x1 using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -129,9 +129,9 @@ static void BM_SM50_device_maximum_plus_ssrgemm_nt_t_16x64x8_16x64x1_4x8_4x8_1x1 using WarpShape = cutlass::gemm::GemmShape<16, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using 
MultOp = Config::MultiplicationOp; @@ -179,9 +179,9 @@ static void BM_SM50_device_maximum_plus_ssrgemm_nt_t_32x32x8_32x32x1_8x4_4x8_1x1 using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -229,9 +229,9 @@ static void BM_SM50_device_maximum_plus_ssrgemm_nt_t_32x64x8_32x64x1_8x8_4x8_1x1 using WarpShape = cutlass::gemm::GemmShape<32, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -279,9 +279,9 @@ static void BM_SM50_device_maximum_plus_ssrgemm_nt_t_64x32x8_64x32x1_8x8_8x4_1x1 using WarpShape = cutlass::gemm::GemmShape<64, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -329,9 +329,9 @@ static void 
BM_SM50_device_maximum_plus_ssrgemm_nt_t_8x32x8_8x16x1_2x2_4x8_1x2(b using WarpShape = cutlass::gemm::GemmShape<8, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -379,9 +379,9 @@ static void BM_SM50_device_maximum_plus_ssrgemm_nt_t_8x64x8_8x32x1_2x4_4x8_1x2(b using WarpShape = cutlass::gemm::GemmShape<8, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -429,9 +429,9 @@ static void BM_SM50_device_maximum_plus_ssrgemm_nt_t_16x32x8_16x16x1_4x2_4x8_1x2 using WarpShape = cutlass::gemm::GemmShape<16, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -479,9 +479,9 @@ static void BM_SM50_device_maximum_plus_ssrgemm_nt_t_16x64x8_16x32x1_4x4_4x8_1x2 using 
WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -529,9 +529,9 @@ static void BM_SM50_device_maximum_plus_ssrgemm_nt_t_16x128x8_16x64x1_4x8_4x8_1x using WarpShape = cutlass::gemm::GemmShape<16, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -579,9 +579,9 @@ static void BM_SM50_device_maximum_plus_ssrgemm_nt_t_32x32x8_32x16x1_4x4_8x4_1x2 using WarpShape = cutlass::gemm::GemmShape<32, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -629,9 +629,9 @@ static void BM_SM50_device_maximum_plus_ssrgemm_nt_t_32x64x8_32x32x1_8x4_4x8_1x2 using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = 
cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -679,9 +679,9 @@ static void BM_SM50_device_maximum_plus_ssrgemm_nt_t_32x128x8_32x64x1_8x8_4x8_1x using WarpShape = cutlass::gemm::GemmShape<32, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -729,9 +729,9 @@ static void BM_SM50_device_maximum_plus_ssrgemm_nt_t_64x64x8_64x32x1_8x8_8x4_1x2 using WarpShape = cutlass::gemm::GemmShape<64, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -779,9 +779,9 @@ static void BM_SM50_device_maximum_plus_ssrgemm_nt_t_32x32x8_16x32x1_4x4_4x8_2x1 using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename 
cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -829,9 +829,9 @@ static void BM_SM50_device_maximum_plus_ssrgemm_nt_t_64x32x8_32x32x1_8x4_4x8_2x1 using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -879,9 +879,9 @@ static void BM_SM50_device_maximum_plus_ssrgemm_nt_t_64x64x8_32x64x1_8x8_4x8_2x1 using WarpShape = cutlass::gemm::GemmShape<32, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -929,9 +929,9 @@ static void BM_SM50_device_maximum_plus_ssrgemm_nt_t_128x32x8_64x32x1_8x8_8x4_2x using WarpShape = cutlass::gemm::GemmShape<64, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, 
precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -979,9 +979,9 @@ static void BM_SM50_device_maximum_plus_ssrgemm_nt_t_16x32x8_8x16x1_2x2_4x8_2x2( using WarpShape = cutlass::gemm::GemmShape<8, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1029,9 +1029,9 @@ static void BM_SM50_device_maximum_plus_ssrgemm_nt_t_16x64x8_8x32x1_2x4_4x8_2x2( using WarpShape = cutlass::gemm::GemmShape<8, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1079,9 +1079,9 @@ static void BM_SM50_device_maximum_plus_ssrgemm_nt_t_32x32x8_16x16x1_4x2_4x8_2x2 using WarpShape = cutlass::gemm::GemmShape<16, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, 
cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1129,9 +1129,9 @@ static void BM_SM50_device_maximum_plus_ssrgemm_nt_t_32x64x8_16x32x1_4x4_4x8_2x2 using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1179,9 +1179,9 @@ static void BM_SM50_device_maximum_plus_ssrgemm_nt_t_32x128x8_16x64x1_4x8_4x8_2x using WarpShape = cutlass::gemm::GemmShape<16, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1229,9 +1229,9 @@ static void BM_SM50_device_maximum_plus_ssrgemm_nt_t_64x32x8_32x16x1_4x4_8x4_2x2 using WarpShape = cutlass::gemm::GemmShape<32, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename 
cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1279,9 +1279,9 @@ static void BM_SM50_device_maximum_plus_ssrgemm_nt_t_64x64x8_32x32x1_8x4_4x8_2x2 using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1329,9 +1329,9 @@ static void BM_SM50_device_maximum_plus_ssrgemm_nt_t_64x128x8_32x64x1_8x8_4x8_2x using WarpShape = cutlass::gemm::GemmShape<32, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1379,9 +1379,9 @@ static void BM_SM50_device_maximum_plus_ssrgemm_nt_t_128x32x8_64x16x1_8x4_8x4_2x using WarpShape = cutlass::gemm::GemmShape<64, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, 
precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1429,9 +1429,9 @@ static void BM_SM50_device_maximum_plus_ssrgemm_nt_t_128x64x8_64x32x1_8x8_8x4_2x using WarpShape = cutlass::gemm::GemmShape<64, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1479,9 +1479,9 @@ static void BM_SM50_device_maximum_plus_ssrgemm_nt_t_16x64x16_8x16x1_2x2_4x8_2x4 using WarpShape = cutlass::gemm::GemmShape<8, 16, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1529,9 +1529,9 @@ static void BM_SM50_device_maximum_plus_ssrgemm_nt_t_16x128x16_8x32x1_2x4_4x8_2x using WarpShape = cutlass::gemm::GemmShape<8, 32, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, 
OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1579,9 +1579,9 @@ static void BM_SM50_device_maximum_plus_ssrgemm_nt_t_32x32x8_16x8x1_2x2_8x4_2x4( using WarpShape = cutlass::gemm::GemmShape<16, 8, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1629,9 +1629,9 @@ static void BM_SM50_device_maximum_plus_ssrgemm_nt_t_32x64x8_16x16x1_4x2_4x8_2x4 using WarpShape = cutlass::gemm::GemmShape<16, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1679,9 +1679,9 @@ static void BM_SM50_device_maximum_plus_ssrgemm_nt_t_32x128x8_16x32x1_4x4_4x8_2x using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = 
Config::MultiplicationOp; @@ -1729,9 +1729,9 @@ static void BM_SM50_device_maximum_plus_ssrgemm_nt_t_32x256x8_16x64x1_4x8_4x8_2x using WarpShape = cutlass::gemm::GemmShape<16, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1779,9 +1779,9 @@ static void BM_SM50_device_maximum_plus_ssrgemm_nt_t_64x64x8_32x16x1_4x4_8x4_2x4 using WarpShape = cutlass::gemm::GemmShape<32, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1829,9 +1829,9 @@ static void BM_SM50_device_maximum_plus_ssrgemm_nt_t_64x128x8_32x32x1_8x4_4x8_2x using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1879,9 +1879,9 @@ static void 
BM_SM50_device_maximum_plus_ssrgemm_nt_t_64x256x8_32x64x1_8x8_4x8_2x using WarpShape = cutlass::gemm::GemmShape<32, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1929,9 +1929,9 @@ static void BM_SM50_device_maximum_plus_ssrgemm_nt_t_128x128x8_64x32x1_8x8_8x4_2 using WarpShape = cutlass::gemm::GemmShape<64, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1979,9 +1979,9 @@ static void BM_SM50_device_maximum_plus_ssrgemm_nt_t_32x32x8_8x16x1_2x2_4x8_4x2( using WarpShape = cutlass::gemm::GemmShape<8, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -2029,9 +2029,9 @@ static void BM_SM50_device_maximum_plus_ssrgemm_nt_t_64x32x8_16x16x1_4x2_4x8_4x2 
using WarpShape = cutlass::gemm::GemmShape<16, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -2079,9 +2079,9 @@ static void BM_SM50_device_maximum_plus_ssrgemm_nt_t_64x64x8_16x32x1_4x4_4x8_4x2 using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -2129,9 +2129,9 @@ static void BM_SM50_device_maximum_plus_ssrgemm_nt_t_128x32x8_32x16x1_4x4_8x4_4x using WarpShape = cutlass::gemm::GemmShape<32, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -2179,9 +2179,9 @@ static void BM_SM50_device_maximum_plus_ssrgemm_nt_t_128x64x8_32x32x1_8x4_4x8_4x using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using 
InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -2229,9 +2229,9 @@ static void BM_SM50_device_maximum_plus_ssrgemm_nt_t_128x128x8_32x64x1_8x8_4x8_4 using WarpShape = cutlass::gemm::GemmShape<32, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -2279,9 +2279,9 @@ static void BM_SM50_device_maximum_plus_ssrgemm_nt_t_256x32x8_64x16x1_8x4_8x4_4x using WarpShape = cutlass::gemm::GemmShape<64, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -2329,9 +2329,9 @@ static void BM_SM50_device_maximum_plus_ssrgemm_nt_t_256x64x8_64x32x1_8x8_8x4_4x using WarpShape = cutlass::gemm::GemmShape<64, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = 
typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -2379,9 +2379,9 @@ static void BM_SM50_device_maximum_plus_ssrgemm_nt_t_32x64x16_8x16x1_2x2_4x8_4x4 using WarpShape = cutlass::gemm::GemmShape<8, 16, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -2429,9 +2429,9 @@ static void BM_SM50_device_maximum_plus_ssrgemm_nt_t_32x128x16_8x32x1_2x4_4x8_4x using WarpShape = cutlass::gemm::GemmShape<8, 32, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -2479,9 +2479,9 @@ static void BM_SM50_device_maximum_plus_ssrgemm_nt_t_64x32x16_16x8x1_2x2_8x4_4x4 using WarpShape = cutlass::gemm::GemmShape<16, 8, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - 
precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -2529,9 +2529,9 @@ static void BM_SM50_device_maximum_plus_ssrgemm_nt_t_64x64x8_16x16x1_4x2_4x8_4x4 using WarpShape = cutlass::gemm::GemmShape<16, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -2579,9 +2579,9 @@ static void BM_SM50_device_maximum_plus_ssrgemm_nt_t_64x128x8_16x32x1_4x4_4x8_4x using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -2629,9 +2629,9 @@ static void BM_SM50_device_maximum_plus_ssrgemm_nt_t_64x256x8_16x64x1_4x8_4x8_4x using WarpShape = cutlass::gemm::GemmShape<16, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - 
cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -2679,9 +2679,9 @@ static void BM_SM50_device_maximum_plus_ssrgemm_nt_t_128x32x16_32x8x1_4x2_8x4_4x using WarpShape = cutlass::gemm::GemmShape<32, 8, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -2729,9 +2729,9 @@ static void BM_SM50_device_maximum_plus_ssrgemm_nt_t_128x64x8_32x16x1_4x4_8x4_4x using WarpShape = cutlass::gemm::GemmShape<32, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -2779,9 +2779,9 @@ static void BM_SM50_device_maximum_plus_ssrgemm_nt_t_128x128x8_32x32x1_8x4_4x8_4 using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename 
cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -2829,9 +2829,9 @@ static void BM_SM50_device_maximum_plus_ssrgemm_nt_t_256x64x8_64x16x1_8x4_8x4_4x using WarpShape = cutlass::gemm::GemmShape<64, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; diff --git a/bench/device/sm50_simt_maximum_plus_ssrgemm_tn_n.cu b/bench/device/sm50_simt_maximum_plus_ssrgemm_tn_n.cu index 770c4be..b143c0a 100644 --- a/bench/device/sm50_simt_maximum_plus_ssrgemm_tn_n.cu +++ b/bench/device/sm50_simt_maximum_plus_ssrgemm_tn_n.cu @@ -29,9 +29,9 @@ static void BM_SM50_device_maximum_plus_ssrgemm_tn_n_8x32x8_8x32x1_2x4_4x8_1x1(b using WarpShape = cutlass::gemm::GemmShape<8, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -79,9 +79,9 @@ static void BM_SM50_device_maximum_plus_ssrgemm_tn_n_16x32x8_16x32x1_4x4_4x8_1x1 using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = 
typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -129,9 +129,9 @@ static void BM_SM50_device_maximum_plus_ssrgemm_tn_n_16x64x8_16x64x1_4x8_4x8_1x1 using WarpShape = cutlass::gemm::GemmShape<16, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -179,9 +179,9 @@ static void BM_SM50_device_maximum_plus_ssrgemm_tn_n_32x32x8_32x32x1_8x4_4x8_1x1 using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -229,9 +229,9 @@ static void BM_SM50_device_maximum_plus_ssrgemm_tn_n_32x64x8_32x64x1_8x8_4x8_1x1 using WarpShape = cutlass::gemm::GemmShape<32, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, 
precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -279,9 +279,9 @@ static void BM_SM50_device_maximum_plus_ssrgemm_tn_n_64x32x8_64x32x1_8x8_8x4_1x1 using WarpShape = cutlass::gemm::GemmShape<64, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -329,9 +329,9 @@ static void BM_SM50_device_maximum_plus_ssrgemm_tn_n_8x32x8_8x16x1_2x2_4x8_1x2(b using WarpShape = cutlass::gemm::GemmShape<8, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -379,9 +379,9 @@ static void BM_SM50_device_maximum_plus_ssrgemm_tn_n_8x64x8_8x32x1_2x4_4x8_1x2(b using WarpShape = cutlass::gemm::GemmShape<8, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, 
SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -429,9 +429,9 @@ static void BM_SM50_device_maximum_plus_ssrgemm_tn_n_16x32x8_16x16x1_4x2_4x8_1x2 using WarpShape = cutlass::gemm::GemmShape<16, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -479,9 +479,9 @@ static void BM_SM50_device_maximum_plus_ssrgemm_tn_n_16x64x8_16x32x1_4x4_4x8_1x2 using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -529,9 +529,9 @@ static void BM_SM50_device_maximum_plus_ssrgemm_tn_n_16x128x8_16x64x1_4x8_4x8_1x using WarpShape = cutlass::gemm::GemmShape<16, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename 
cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -579,9 +579,9 @@ static void BM_SM50_device_maximum_plus_ssrgemm_tn_n_32x32x8_32x16x1_4x4_8x4_1x2 using WarpShape = cutlass::gemm::GemmShape<32, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -629,9 +629,9 @@ static void BM_SM50_device_maximum_plus_ssrgemm_tn_n_32x64x8_32x32x1_8x4_4x8_1x2 using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -679,9 +679,9 @@ static void BM_SM50_device_maximum_plus_ssrgemm_tn_n_32x128x8_32x64x1_8x8_4x8_1x using WarpShape = cutlass::gemm::GemmShape<32, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, 
precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -729,9 +729,9 @@ static void BM_SM50_device_maximum_plus_ssrgemm_tn_n_64x64x8_64x32x1_8x8_8x4_1x2 using WarpShape = cutlass::gemm::GemmShape<64, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -779,9 +779,9 @@ static void BM_SM50_device_maximum_plus_ssrgemm_tn_n_32x32x8_16x32x1_4x4_4x8_2x1 using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -829,9 +829,9 @@ static void BM_SM50_device_maximum_plus_ssrgemm_tn_n_64x32x8_32x32x1_8x4_4x8_2x1 using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using 
AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -879,9 +879,9 @@ static void BM_SM50_device_maximum_plus_ssrgemm_tn_n_64x64x8_32x64x1_8x8_4x8_2x1 using WarpShape = cutlass::gemm::GemmShape<32, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -929,9 +929,9 @@ static void BM_SM50_device_maximum_plus_ssrgemm_tn_n_128x32x8_64x32x1_8x8_8x4_2x using WarpShape = cutlass::gemm::GemmShape<64, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -979,9 +979,9 @@ static void BM_SM50_device_maximum_plus_ssrgemm_tn_n_16x32x8_8x16x1_2x2_4x8_2x2( using WarpShape = cutlass::gemm::GemmShape<8, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ 
-1029,9 +1029,9 @@ static void BM_SM50_device_maximum_plus_ssrgemm_tn_n_16x64x8_8x32x1_2x4_4x8_2x2( using WarpShape = cutlass::gemm::GemmShape<8, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1079,9 +1079,9 @@ static void BM_SM50_device_maximum_plus_ssrgemm_tn_n_32x32x8_16x16x1_4x2_4x8_2x2 using WarpShape = cutlass::gemm::GemmShape<16, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1129,9 +1129,9 @@ static void BM_SM50_device_maximum_plus_ssrgemm_tn_n_32x64x8_16x32x1_4x4_4x8_2x2 using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1179,9 +1179,9 @@ static void 
BM_SM50_device_maximum_plus_ssrgemm_tn_n_32x128x8_16x64x1_4x8_4x8_2x using WarpShape = cutlass::gemm::GemmShape<16, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1229,9 +1229,9 @@ static void BM_SM50_device_maximum_plus_ssrgemm_tn_n_64x32x8_32x16x1_4x4_8x4_2x2 using WarpShape = cutlass::gemm::GemmShape<32, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1279,9 +1279,9 @@ static void BM_SM50_device_maximum_plus_ssrgemm_tn_n_64x64x8_32x32x1_8x4_4x8_2x2 using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1329,9 +1329,9 @@ static void BM_SM50_device_maximum_plus_ssrgemm_tn_n_64x128x8_32x64x1_8x8_4x8_2x 
using WarpShape = cutlass::gemm::GemmShape<32, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1379,9 +1379,9 @@ static void BM_SM50_device_maximum_plus_ssrgemm_tn_n_128x32x8_64x16x1_8x4_8x4_2x using WarpShape = cutlass::gemm::GemmShape<64, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1429,9 +1429,9 @@ static void BM_SM50_device_maximum_plus_ssrgemm_tn_n_128x64x8_64x32x1_8x8_8x4_2x using WarpShape = cutlass::gemm::GemmShape<64, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1479,9 +1479,9 @@ static void BM_SM50_device_maximum_plus_ssrgemm_tn_n_16x64x16_8x16x1_2x2_4x8_2x4 using WarpShape = cutlass::gemm::GemmShape<8, 16, 16>; using 
InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1529,9 +1529,9 @@ static void BM_SM50_device_maximum_plus_ssrgemm_tn_n_16x128x16_8x32x1_2x4_4x8_2x using WarpShape = cutlass::gemm::GemmShape<8, 32, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1579,9 +1579,9 @@ static void BM_SM50_device_maximum_plus_ssrgemm_tn_n_32x32x8_16x8x1_2x2_8x4_2x4( using WarpShape = cutlass::gemm::GemmShape<16, 8, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1629,9 +1629,9 @@ static void BM_SM50_device_maximum_plus_ssrgemm_tn_n_32x64x8_16x16x1_4x2_4x8_2x4 using WarpShape = cutlass::gemm::GemmShape<16, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = 
typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1679,9 +1679,9 @@ static void BM_SM50_device_maximum_plus_ssrgemm_tn_n_32x128x8_16x32x1_4x4_4x8_2x using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1729,9 +1729,9 @@ static void BM_SM50_device_maximum_plus_ssrgemm_tn_n_32x256x8_16x64x1_4x8_4x8_2x using WarpShape = cutlass::gemm::GemmShape<16, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1779,9 +1779,9 @@ static void BM_SM50_device_maximum_plus_ssrgemm_tn_n_64x64x8_32x16x1_4x4_8x4_2x4 using WarpShape = cutlass::gemm::GemmShape<32, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - 
precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1829,9 +1829,9 @@ static void BM_SM50_device_maximum_plus_ssrgemm_tn_n_64x128x8_32x32x1_8x4_4x8_2x using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1879,9 +1879,9 @@ static void BM_SM50_device_maximum_plus_ssrgemm_tn_n_64x256x8_32x64x1_8x8_4x8_2x using WarpShape = cutlass::gemm::GemmShape<32, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1929,9 +1929,9 @@ static void BM_SM50_device_maximum_plus_ssrgemm_tn_n_128x128x8_64x32x1_8x8_8x4_2 using WarpShape = cutlass::gemm::GemmShape<64, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - 
cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1979,9 +1979,9 @@ static void BM_SM50_device_maximum_plus_ssrgemm_tn_n_32x32x8_8x16x1_2x2_4x8_4x2( using WarpShape = cutlass::gemm::GemmShape<8, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -2029,9 +2029,9 @@ static void BM_SM50_device_maximum_plus_ssrgemm_tn_n_64x32x8_16x16x1_4x2_4x8_4x2 using WarpShape = cutlass::gemm::GemmShape<16, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -2079,9 +2079,9 @@ static void BM_SM50_device_maximum_plus_ssrgemm_tn_n_64x64x8_16x32x1_4x4_4x8_4x2 using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename 
cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -2129,9 +2129,9 @@ static void BM_SM50_device_maximum_plus_ssrgemm_tn_n_128x32x8_32x16x1_4x4_8x4_4x using WarpShape = cutlass::gemm::GemmShape<32, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -2179,9 +2179,9 @@ static void BM_SM50_device_maximum_plus_ssrgemm_tn_n_128x64x8_32x32x1_8x4_4x8_4x using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -2229,9 +2229,9 @@ static void BM_SM50_device_maximum_plus_ssrgemm_tn_n_128x128x8_32x64x1_8x8_4x8_4 using WarpShape = cutlass::gemm::GemmShape<32, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, 
precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -2279,9 +2279,9 @@ static void BM_SM50_device_maximum_plus_ssrgemm_tn_n_256x32x8_64x16x1_8x4_8x4_4x using WarpShape = cutlass::gemm::GemmShape<64, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -2329,9 +2329,9 @@ static void BM_SM50_device_maximum_plus_ssrgemm_tn_n_256x64x8_64x32x1_8x8_8x4_4x using WarpShape = cutlass::gemm::GemmShape<64, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -2379,9 +2379,9 @@ static void BM_SM50_device_maximum_plus_ssrgemm_tn_n_32x64x16_8x16x1_2x2_4x8_4x4 using WarpShape = cutlass::gemm::GemmShape<8, 16, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, 
OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -2429,9 +2429,9 @@ static void BM_SM50_device_maximum_plus_ssrgemm_tn_n_32x128x16_8x32x1_2x4_4x8_4x using WarpShape = cutlass::gemm::GemmShape<8, 32, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -2479,9 +2479,9 @@ static void BM_SM50_device_maximum_plus_ssrgemm_tn_n_64x32x16_16x8x1_2x2_8x4_4x4 using WarpShape = cutlass::gemm::GemmShape<16, 8, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -2529,9 +2529,9 @@ static void BM_SM50_device_maximum_plus_ssrgemm_tn_n_64x64x8_16x16x1_4x2_4x8_4x4 using WarpShape = cutlass::gemm::GemmShape<16, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = 
Config::MultiplicationOp; @@ -2579,9 +2579,9 @@ static void BM_SM50_device_maximum_plus_ssrgemm_tn_n_64x128x8_16x32x1_4x4_4x8_4x using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -2629,9 +2629,9 @@ static void BM_SM50_device_maximum_plus_ssrgemm_tn_n_64x256x8_16x64x1_4x8_4x8_4x using WarpShape = cutlass::gemm::GemmShape<16, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -2679,9 +2679,9 @@ static void BM_SM50_device_maximum_plus_ssrgemm_tn_n_128x32x16_32x8x1_4x2_8x4_4x using WarpShape = cutlass::gemm::GemmShape<32, 8, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -2729,9 +2729,9 @@ static void 
BM_SM50_device_maximum_plus_ssrgemm_tn_n_128x64x8_32x16x1_4x4_8x4_4x using WarpShape = cutlass::gemm::GemmShape<32, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -2779,9 +2779,9 @@ static void BM_SM50_device_maximum_plus_ssrgemm_tn_n_128x128x8_32x32x1_8x4_4x8_4 using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -2829,9 +2829,9 @@ static void BM_SM50_device_maximum_plus_ssrgemm_tn_n_256x64x8_64x16x1_8x4_8x4_4x using WarpShape = cutlass::gemm::GemmShape<64, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; diff --git a/bench/device/sm50_simt_maximum_plus_ssrgemm_tn_t.cu 
b/bench/device/sm50_simt_maximum_plus_ssrgemm_tn_t.cu index 38a96a4..7ad52c0 100644 --- a/bench/device/sm50_simt_maximum_plus_ssrgemm_tn_t.cu +++ b/bench/device/sm50_simt_maximum_plus_ssrgemm_tn_t.cu @@ -29,9 +29,9 @@ static void BM_SM50_device_maximum_plus_ssrgemm_tn_t_8x32x8_8x32x1_2x4_4x8_1x1(b using WarpShape = cutlass::gemm::GemmShape<8, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -79,9 +79,9 @@ static void BM_SM50_device_maximum_plus_ssrgemm_tn_t_16x32x8_16x32x1_4x4_4x8_1x1 using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -129,9 +129,9 @@ static void BM_SM50_device_maximum_plus_ssrgemm_tn_t_16x64x8_16x64x1_4x8_4x8_1x1 using WarpShape = cutlass::gemm::GemmShape<16, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + 
cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -179,9 +179,9 @@ static void BM_SM50_device_maximum_plus_ssrgemm_tn_t_32x32x8_32x32x1_8x4_4x8_1x1 using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -229,9 +229,9 @@ static void BM_SM50_device_maximum_plus_ssrgemm_tn_t_32x64x8_32x64x1_8x8_4x8_1x1 using WarpShape = cutlass::gemm::GemmShape<32, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -279,9 +279,9 @@ static void BM_SM50_device_maximum_plus_ssrgemm_tn_t_64x32x8_64x32x1_8x8_8x4_1x1 using WarpShape = cutlass::gemm::GemmShape<64, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = 
Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -329,9 +329,9 @@ static void BM_SM50_device_maximum_plus_ssrgemm_tn_t_8x32x8_8x16x1_2x2_4x8_1x2(b using WarpShape = cutlass::gemm::GemmShape<8, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -379,9 +379,9 @@ static void BM_SM50_device_maximum_plus_ssrgemm_tn_t_8x64x8_8x32x1_2x4_4x8_1x2(b using WarpShape = cutlass::gemm::GemmShape<8, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -429,9 +429,9 @@ static void BM_SM50_device_maximum_plus_ssrgemm_tn_t_16x32x8_16x16x1_4x2_4x8_1x2 using WarpShape = cutlass::gemm::GemmShape<16, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -479,9 +479,9 
@@ static void BM_SM50_device_maximum_plus_ssrgemm_tn_t_16x64x8_16x32x1_4x4_4x8_1x2 using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -529,9 +529,9 @@ static void BM_SM50_device_maximum_plus_ssrgemm_tn_t_16x128x8_16x64x1_4x8_4x8_1x using WarpShape = cutlass::gemm::GemmShape<16, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -579,9 +579,9 @@ static void BM_SM50_device_maximum_plus_ssrgemm_tn_t_32x32x8_32x16x1_4x4_8x4_1x2 using WarpShape = cutlass::gemm::GemmShape<32, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -629,9 +629,9 @@ static void 
BM_SM50_device_maximum_plus_ssrgemm_tn_t_32x64x8_32x32x1_8x4_4x8_1x2 using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -679,9 +679,9 @@ static void BM_SM50_device_maximum_plus_ssrgemm_tn_t_32x128x8_32x64x1_8x8_4x8_1x using WarpShape = cutlass::gemm::GemmShape<32, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -729,9 +729,9 @@ static void BM_SM50_device_maximum_plus_ssrgemm_tn_t_64x64x8_64x32x1_8x8_8x4_1x2 using WarpShape = cutlass::gemm::GemmShape<64, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -779,9 +779,9 @@ static void BM_SM50_device_maximum_plus_ssrgemm_tn_t_32x32x8_16x32x1_4x4_4x8_2x1 using 
WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -829,9 +829,9 @@ static void BM_SM50_device_maximum_plus_ssrgemm_tn_t_64x32x8_32x32x1_8x4_4x8_2x1 using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -879,9 +879,9 @@ static void BM_SM50_device_maximum_plus_ssrgemm_tn_t_64x64x8_32x64x1_8x8_4x8_2x1 using WarpShape = cutlass::gemm::GemmShape<32, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -929,9 +929,9 @@ static void BM_SM50_device_maximum_plus_ssrgemm_tn_t_128x32x8_64x32x1_8x8_8x4_2x using WarpShape = cutlass::gemm::GemmShape<64, 32, 8>; using InstructionShape = 
cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -979,9 +979,9 @@ static void BM_SM50_device_maximum_plus_ssrgemm_tn_t_16x32x8_8x16x1_2x2_4x8_2x2( using WarpShape = cutlass::gemm::GemmShape<8, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1029,9 +1029,9 @@ static void BM_SM50_device_maximum_plus_ssrgemm_tn_t_16x64x8_8x32x1_2x4_4x8_2x2( using WarpShape = cutlass::gemm::GemmShape<8, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1079,9 +1079,9 @@ static void BM_SM50_device_maximum_plus_ssrgemm_tn_t_32x32x8_16x16x1_4x2_4x8_2x2 using WarpShape = cutlass::gemm::GemmShape<16, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename 
cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1129,9 +1129,9 @@ static void BM_SM50_device_maximum_plus_ssrgemm_tn_t_32x64x8_16x32x1_4x4_4x8_2x2 using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1179,9 +1179,9 @@ static void BM_SM50_device_maximum_plus_ssrgemm_tn_t_32x128x8_16x64x1_4x8_4x8_2x using WarpShape = cutlass::gemm::GemmShape<16, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1229,9 +1229,9 @@ static void BM_SM50_device_maximum_plus_ssrgemm_tn_t_64x32x8_32x16x1_4x4_8x4_2x2 using WarpShape = cutlass::gemm::GemmShape<32, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, 
precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1279,9 +1279,9 @@ static void BM_SM50_device_maximum_plus_ssrgemm_tn_t_64x64x8_32x32x1_8x4_4x8_2x2 using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1329,9 +1329,9 @@ static void BM_SM50_device_maximum_plus_ssrgemm_tn_t_64x128x8_32x64x1_8x8_4x8_2x using WarpShape = cutlass::gemm::GemmShape<32, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1379,9 +1379,9 @@ static void BM_SM50_device_maximum_plus_ssrgemm_tn_t_128x32x8_64x16x1_8x4_8x4_2x using WarpShape = cutlass::gemm::GemmShape<64, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, 
cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1429,9 +1429,9 @@ static void BM_SM50_device_maximum_plus_ssrgemm_tn_t_128x64x8_64x32x1_8x8_8x4_2x using WarpShape = cutlass::gemm::GemmShape<64, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1479,9 +1479,9 @@ static void BM_SM50_device_maximum_plus_ssrgemm_tn_t_16x64x16_8x16x1_2x2_4x8_2x4 using WarpShape = cutlass::gemm::GemmShape<8, 16, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1529,9 +1529,9 @@ static void BM_SM50_device_maximum_plus_ssrgemm_tn_t_16x128x16_8x32x1_2x4_4x8_2x using WarpShape = cutlass::gemm::GemmShape<8, 32, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename 
cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1579,9 +1579,9 @@ static void BM_SM50_device_maximum_plus_ssrgemm_tn_t_32x32x8_16x8x1_2x2_8x4_2x4( using WarpShape = cutlass::gemm::GemmShape<16, 8, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1629,9 +1629,9 @@ static void BM_SM50_device_maximum_plus_ssrgemm_tn_t_32x64x8_16x16x1_4x2_4x8_2x4 using WarpShape = cutlass::gemm::GemmShape<16, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1679,9 +1679,9 @@ static void BM_SM50_device_maximum_plus_ssrgemm_tn_t_32x128x8_16x32x1_4x4_4x8_2x using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, 
precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1729,9 +1729,9 @@ static void BM_SM50_device_maximum_plus_ssrgemm_tn_t_32x256x8_16x64x1_4x8_4x8_2x using WarpShape = cutlass::gemm::GemmShape<16, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1779,9 +1779,9 @@ static void BM_SM50_device_maximum_plus_ssrgemm_tn_t_64x64x8_32x16x1_4x4_8x4_2x4 using WarpShape = cutlass::gemm::GemmShape<32, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1829,9 +1829,9 @@ static void BM_SM50_device_maximum_plus_ssrgemm_tn_t_64x128x8_32x32x1_8x4_4x8_2x using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, 
OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1879,9 +1879,9 @@ static void BM_SM50_device_maximum_plus_ssrgemm_tn_t_64x256x8_32x64x1_8x8_4x8_2x using WarpShape = cutlass::gemm::GemmShape<32, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1929,9 +1929,9 @@ static void BM_SM50_device_maximum_plus_ssrgemm_tn_t_128x128x8_64x32x1_8x8_8x4_2 using WarpShape = cutlass::gemm::GemmShape<64, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1979,9 +1979,9 @@ static void BM_SM50_device_maximum_plus_ssrgemm_tn_t_32x32x8_8x16x1_2x2_4x8_4x2( using WarpShape = cutlass::gemm::GemmShape<8, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = 
Config::MultiplicationOp; @@ -2029,9 +2029,9 @@ static void BM_SM50_device_maximum_plus_ssrgemm_tn_t_64x32x8_16x16x1_4x2_4x8_4x2 using WarpShape = cutlass::gemm::GemmShape<16, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -2079,9 +2079,9 @@ static void BM_SM50_device_maximum_plus_ssrgemm_tn_t_64x64x8_16x32x1_4x4_4x8_4x2 using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -2129,9 +2129,9 @@ static void BM_SM50_device_maximum_plus_ssrgemm_tn_t_128x32x8_32x16x1_4x4_8x4_4x using WarpShape = cutlass::gemm::GemmShape<32, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -2179,9 +2179,9 @@ static void 
BM_SM50_device_maximum_plus_ssrgemm_tn_t_128x64x8_32x32x1_8x4_4x8_4x using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -2229,9 +2229,9 @@ static void BM_SM50_device_maximum_plus_ssrgemm_tn_t_128x128x8_32x64x1_8x8_4x8_4 using WarpShape = cutlass::gemm::GemmShape<32, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -2279,9 +2279,9 @@ static void BM_SM50_device_maximum_plus_ssrgemm_tn_t_256x32x8_64x16x1_8x4_8x4_4x using WarpShape = cutlass::gemm::GemmShape<64, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -2329,9 +2329,9 @@ static void BM_SM50_device_maximum_plus_ssrgemm_tn_t_256x64x8_64x32x1_8x8_8x4_4x 
using WarpShape = cutlass::gemm::GemmShape<64, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -2379,9 +2379,9 @@ static void BM_SM50_device_maximum_plus_ssrgemm_tn_t_32x64x16_8x16x1_2x2_4x8_4x4 using WarpShape = cutlass::gemm::GemmShape<8, 16, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -2429,9 +2429,9 @@ static void BM_SM50_device_maximum_plus_ssrgemm_tn_t_32x128x16_8x32x1_2x4_4x8_4x using WarpShape = cutlass::gemm::GemmShape<8, 32, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -2479,9 +2479,9 @@ static void BM_SM50_device_maximum_plus_ssrgemm_tn_t_64x32x16_16x8x1_2x2_8x4_4x4 using WarpShape = cutlass::gemm::GemmShape<16, 8, 16>; using 
InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -2529,9 +2529,9 @@ static void BM_SM50_device_maximum_plus_ssrgemm_tn_t_64x64x8_16x16x1_4x2_4x8_4x4 using WarpShape = cutlass::gemm::GemmShape<16, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -2579,9 +2579,9 @@ static void BM_SM50_device_maximum_plus_ssrgemm_tn_t_64x128x8_16x32x1_4x4_4x8_4x using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -2629,9 +2629,9 @@ static void BM_SM50_device_maximum_plus_ssrgemm_tn_t_64x256x8_16x64x1_4x8_4x8_4x using WarpShape = cutlass::gemm::GemmShape<16, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = 
typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -2679,9 +2679,9 @@ static void BM_SM50_device_maximum_plus_ssrgemm_tn_t_128x32x16_32x8x1_4x2_8x4_4x using WarpShape = cutlass::gemm::GemmShape<32, 8, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -2729,9 +2729,9 @@ static void BM_SM50_device_maximum_plus_ssrgemm_tn_t_128x64x8_32x16x1_4x4_8x4_4x using WarpShape = cutlass::gemm::GemmShape<32, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -2779,9 +2779,9 @@ static void BM_SM50_device_maximum_plus_ssrgemm_tn_t_128x128x8_32x32x1_8x4_4x8_4 using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - 
precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -2829,9 +2829,9 @@ static void BM_SM50_device_maximum_plus_ssrgemm_tn_t_256x64x8_64x16x1_8x4_8x4_4x using WarpShape = cutlass::gemm::GemmShape<64, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; diff --git a/bench/device/sm50_simt_maximum_plus_ssrgemm_tt_n.cu b/bench/device/sm50_simt_maximum_plus_ssrgemm_tt_n.cu index d25b3ce..adb45e8 100644 --- a/bench/device/sm50_simt_maximum_plus_ssrgemm_tt_n.cu +++ b/bench/device/sm50_simt_maximum_plus_ssrgemm_tt_n.cu @@ -29,9 +29,9 @@ static void BM_SM50_device_maximum_plus_ssrgemm_tt_n_8x32x8_8x32x1_2x4_4x8_1x1(b using WarpShape = cutlass::gemm::GemmShape<8, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -79,9 +79,9 @@ static void BM_SM50_device_maximum_plus_ssrgemm_tt_n_16x32x8_16x32x1_4x4_4x8_1x1 using 
WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -129,9 +129,9 @@ static void BM_SM50_device_maximum_plus_ssrgemm_tt_n_16x64x8_16x64x1_4x8_4x8_1x1 using WarpShape = cutlass::gemm::GemmShape<16, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -179,9 +179,9 @@ static void BM_SM50_device_maximum_plus_ssrgemm_tt_n_32x32x8_32x32x1_8x4_4x8_1x1 using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -229,9 +229,9 @@ static void BM_SM50_device_maximum_plus_ssrgemm_tt_n_32x64x8_32x64x1_8x8_4x8_1x1 using WarpShape = cutlass::gemm::GemmShape<32, 64, 8>; using InstructionShape = 
cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -279,9 +279,9 @@ static void BM_SM50_device_maximum_plus_ssrgemm_tt_n_64x32x8_64x32x1_8x8_8x4_1x1 using WarpShape = cutlass::gemm::GemmShape<64, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -329,9 +329,9 @@ static void BM_SM50_device_maximum_plus_ssrgemm_tt_n_8x32x8_8x16x1_2x2_4x8_1x2(b using WarpShape = cutlass::gemm::GemmShape<8, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -379,9 +379,9 @@ static void BM_SM50_device_maximum_plus_ssrgemm_tt_n_8x64x8_8x32x1_2x4_4x8_1x2(b using WarpShape = cutlass::gemm::GemmShape<8, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename 
cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -429,9 +429,9 @@ static void BM_SM50_device_maximum_plus_ssrgemm_tt_n_16x32x8_16x16x1_4x2_4x8_1x2 using WarpShape = cutlass::gemm::GemmShape<16, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -479,9 +479,9 @@ static void BM_SM50_device_maximum_plus_ssrgemm_tt_n_16x64x8_16x32x1_4x4_4x8_1x2 using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -529,9 +529,9 @@ static void BM_SM50_device_maximum_plus_ssrgemm_tt_n_16x128x8_16x64x1_4x8_4x8_1x using WarpShape = cutlass::gemm::GemmShape<16, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, 
precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -579,9 +579,9 @@ static void BM_SM50_device_maximum_plus_ssrgemm_tt_n_32x32x8_32x16x1_4x4_8x4_1x2 using WarpShape = cutlass::gemm::GemmShape<32, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -629,9 +629,9 @@ static void BM_SM50_device_maximum_plus_ssrgemm_tt_n_32x64x8_32x32x1_8x4_4x8_1x2 using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -679,9 +679,9 @@ static void BM_SM50_device_maximum_plus_ssrgemm_tt_n_32x128x8_32x64x1_8x8_4x8_1x using WarpShape = cutlass::gemm::GemmShape<32, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, 
SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -729,9 +729,9 @@ static void BM_SM50_device_maximum_plus_ssrgemm_tt_n_64x64x8_64x32x1_8x8_8x4_1x2 using WarpShape = cutlass::gemm::GemmShape<64, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -779,9 +779,9 @@ static void BM_SM50_device_maximum_plus_ssrgemm_tt_n_32x32x8_16x32x1_4x4_4x8_2x1 using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -829,9 +829,9 @@ static void BM_SM50_device_maximum_plus_ssrgemm_tt_n_64x32x8_32x32x1_8x4_4x8_2x1 using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename 
cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -879,9 +879,9 @@ static void BM_SM50_device_maximum_plus_ssrgemm_tt_n_64x64x8_32x64x1_8x8_4x8_2x1 using WarpShape = cutlass::gemm::GemmShape<32, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -929,9 +929,9 @@ static void BM_SM50_device_maximum_plus_ssrgemm_tt_n_128x32x8_64x32x1_8x8_8x4_2x using WarpShape = cutlass::gemm::GemmShape<64, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -979,9 +979,9 @@ static void BM_SM50_device_maximum_plus_ssrgemm_tt_n_16x32x8_8x16x1_2x2_4x8_2x2( using WarpShape = cutlass::gemm::GemmShape<8, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, 
precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1029,9 +1029,9 @@ static void BM_SM50_device_maximum_plus_ssrgemm_tt_n_16x64x8_8x32x1_2x4_4x8_2x2( using WarpShape = cutlass::gemm::GemmShape<8, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1079,9 +1079,9 @@ static void BM_SM50_device_maximum_plus_ssrgemm_tt_n_32x32x8_16x16x1_4x2_4x8_2x2 using WarpShape = cutlass::gemm::GemmShape<16, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1129,9 +1129,9 @@ static void BM_SM50_device_maximum_plus_ssrgemm_tt_n_32x64x8_16x32x1_4x4_4x8_2x2 using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; 
using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1179,9 +1179,9 @@ static void BM_SM50_device_maximum_plus_ssrgemm_tt_n_32x128x8_16x64x1_4x8_4x8_2x using WarpShape = cutlass::gemm::GemmShape<16, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1229,9 +1229,9 @@ static void BM_SM50_device_maximum_plus_ssrgemm_tt_n_64x32x8_32x16x1_4x4_8x4_2x2 using WarpShape = cutlass::gemm::GemmShape<32, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1279,9 +1279,9 @@ static void BM_SM50_device_maximum_plus_ssrgemm_tt_n_64x64x8_32x32x1_8x4_4x8_2x2 using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = 
Config::MultiplicationOp; @@ -1329,9 +1329,9 @@ static void BM_SM50_device_maximum_plus_ssrgemm_tt_n_64x128x8_32x64x1_8x8_4x8_2x using WarpShape = cutlass::gemm::GemmShape<32, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1379,9 +1379,9 @@ static void BM_SM50_device_maximum_plus_ssrgemm_tt_n_128x32x8_64x16x1_8x4_8x4_2x using WarpShape = cutlass::gemm::GemmShape<64, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1429,9 +1429,9 @@ static void BM_SM50_device_maximum_plus_ssrgemm_tt_n_128x64x8_64x32x1_8x8_8x4_2x using WarpShape = cutlass::gemm::GemmShape<64, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1479,9 +1479,9 @@ static void 
BM_SM50_device_maximum_plus_ssrgemm_tt_n_16x64x16_8x16x1_2x2_4x8_2x4 using WarpShape = cutlass::gemm::GemmShape<8, 16, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1529,9 +1529,9 @@ static void BM_SM50_device_maximum_plus_ssrgemm_tt_n_16x128x16_8x32x1_2x4_4x8_2x using WarpShape = cutlass::gemm::GemmShape<8, 32, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1579,9 +1579,9 @@ static void BM_SM50_device_maximum_plus_ssrgemm_tt_n_32x32x8_16x8x1_2x2_8x4_2x4( using WarpShape = cutlass::gemm::GemmShape<16, 8, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1629,9 +1629,9 @@ static void BM_SM50_device_maximum_plus_ssrgemm_tt_n_32x64x8_16x16x1_4x2_4x8_2x4 
using WarpShape = cutlass::gemm::GemmShape<16, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1679,9 +1679,9 @@ static void BM_SM50_device_maximum_plus_ssrgemm_tt_n_32x128x8_16x32x1_4x4_4x8_2x using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1729,9 +1729,9 @@ static void BM_SM50_device_maximum_plus_ssrgemm_tt_n_32x256x8_16x64x1_4x8_4x8_2x using WarpShape = cutlass::gemm::GemmShape<16, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1779,9 +1779,9 @@ static void BM_SM50_device_maximum_plus_ssrgemm_tt_n_64x64x8_32x16x1_4x4_8x4_2x4 using WarpShape = cutlass::gemm::GemmShape<32, 16, 8>; using 
InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1829,9 +1829,9 @@ static void BM_SM50_device_maximum_plus_ssrgemm_tt_n_64x128x8_32x32x1_8x4_4x8_2x using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1879,9 +1879,9 @@ static void BM_SM50_device_maximum_plus_ssrgemm_tt_n_64x256x8_32x64x1_8x8_4x8_2x using WarpShape = cutlass::gemm::GemmShape<32, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1929,9 +1929,9 @@ static void BM_SM50_device_maximum_plus_ssrgemm_tt_n_128x128x8_64x32x1_8x8_8x4_2 using WarpShape = cutlass::gemm::GemmShape<64, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = 
typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1979,9 +1979,9 @@ static void BM_SM50_device_maximum_plus_ssrgemm_tt_n_32x32x8_8x16x1_2x2_4x8_4x2( using WarpShape = cutlass::gemm::GemmShape<8, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -2029,9 +2029,9 @@ static void BM_SM50_device_maximum_plus_ssrgemm_tt_n_64x32x8_16x16x1_4x2_4x8_4x2 using WarpShape = cutlass::gemm::GemmShape<16, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -2079,9 +2079,9 @@ static void BM_SM50_device_maximum_plus_ssrgemm_tt_n_64x64x8_16x32x1_4x4_4x8_4x2 using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - 
precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -2129,9 +2129,9 @@ static void BM_SM50_device_maximum_plus_ssrgemm_tt_n_128x32x8_32x16x1_4x4_8x4_4x using WarpShape = cutlass::gemm::GemmShape<32, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -2179,9 +2179,9 @@ static void BM_SM50_device_maximum_plus_ssrgemm_tt_n_128x64x8_32x32x1_8x4_4x8_4x using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -2229,9 +2229,9 @@ static void BM_SM50_device_maximum_plus_ssrgemm_tt_n_128x128x8_32x64x1_8x8_4x8_4 using WarpShape = cutlass::gemm::GemmShape<32, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - 
cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -2279,9 +2279,9 @@ static void BM_SM50_device_maximum_plus_ssrgemm_tt_n_256x32x8_64x16x1_8x4_8x4_4x using WarpShape = cutlass::gemm::GemmShape<64, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -2329,9 +2329,9 @@ static void BM_SM50_device_maximum_plus_ssrgemm_tt_n_256x64x8_64x32x1_8x8_8x4_4x using WarpShape = cutlass::gemm::GemmShape<64, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -2379,9 +2379,9 @@ static void BM_SM50_device_maximum_plus_ssrgemm_tt_n_32x64x16_8x16x1_2x2_4x8_4x4 using WarpShape = cutlass::gemm::GemmShape<8, 16, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename 
cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -2429,9 +2429,9 @@ static void BM_SM50_device_maximum_plus_ssrgemm_tt_n_32x128x16_8x32x1_2x4_4x8_4x using WarpShape = cutlass::gemm::GemmShape<8, 32, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -2479,9 +2479,9 @@ static void BM_SM50_device_maximum_plus_ssrgemm_tt_n_64x32x16_16x8x1_2x2_8x4_4x4 using WarpShape = cutlass::gemm::GemmShape<16, 8, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -2529,9 +2529,9 @@ static void BM_SM50_device_maximum_plus_ssrgemm_tt_n_64x64x8_16x16x1_4x2_4x8_4x4 using WarpShape = cutlass::gemm::GemmShape<16, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, 
precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -2579,9 +2579,9 @@ static void BM_SM50_device_maximum_plus_ssrgemm_tt_n_64x128x8_16x32x1_4x4_4x8_4x using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -2629,9 +2629,9 @@ static void BM_SM50_device_maximum_plus_ssrgemm_tt_n_64x256x8_16x64x1_4x8_4x8_4x using WarpShape = cutlass::gemm::GemmShape<16, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -2679,9 +2679,9 @@ static void BM_SM50_device_maximum_plus_ssrgemm_tt_n_128x32x16_32x8x1_4x2_8x4_4x using WarpShape = cutlass::gemm::GemmShape<32, 8, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, 
OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -2729,9 +2729,9 @@ static void BM_SM50_device_maximum_plus_ssrgemm_tt_n_128x64x8_32x16x1_4x4_8x4_4x using WarpShape = cutlass::gemm::GemmShape<32, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -2779,9 +2779,9 @@ static void BM_SM50_device_maximum_plus_ssrgemm_tt_n_128x128x8_32x32x1_8x4_4x8_4 using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -2829,9 +2829,9 @@ static void BM_SM50_device_maximum_plus_ssrgemm_tt_n_256x64x8_64x16x1_8x4_8x4_4x using WarpShape = cutlass::gemm::GemmShape<64, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = 
Config::MultiplicationOp; diff --git a/bench/device/sm50_simt_maximum_plus_ssrgemm_tt_t.cu b/bench/device/sm50_simt_maximum_plus_ssrgemm_tt_t.cu index af15645..75566d4 100644 --- a/bench/device/sm50_simt_maximum_plus_ssrgemm_tt_t.cu +++ b/bench/device/sm50_simt_maximum_plus_ssrgemm_tt_t.cu @@ -29,9 +29,9 @@ static void BM_SM50_device_maximum_plus_ssrgemm_tt_t_8x32x8_8x32x1_2x4_4x8_1x1(b using WarpShape = cutlass::gemm::GemmShape<8, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -79,9 +79,9 @@ static void BM_SM50_device_maximum_plus_ssrgemm_tt_t_16x32x8_16x32x1_4x4_4x8_1x1 using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -129,9 +129,9 @@ static void BM_SM50_device_maximum_plus_ssrgemm_tt_t_16x64x8_16x64x1_4x8_4x8_1x1 using WarpShape = cutlass::gemm::GemmShape<16, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename 
cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -179,9 +179,9 @@ static void BM_SM50_device_maximum_plus_ssrgemm_tt_t_32x32x8_32x32x1_8x4_4x8_1x1 using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -229,9 +229,9 @@ static void BM_SM50_device_maximum_plus_ssrgemm_tt_t_32x64x8_32x64x1_8x8_4x8_1x1 using WarpShape = cutlass::gemm::GemmShape<32, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -279,9 +279,9 @@ static void BM_SM50_device_maximum_plus_ssrgemm_tt_t_64x32x8_64x32x1_8x8_8x4_1x1 using WarpShape = cutlass::gemm::GemmShape<64, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, 
precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -329,9 +329,9 @@ static void BM_SM50_device_maximum_plus_ssrgemm_tt_t_8x32x8_8x16x1_2x2_4x8_1x2(b using WarpShape = cutlass::gemm::GemmShape<8, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -379,9 +379,9 @@ static void BM_SM50_device_maximum_plus_ssrgemm_tt_t_8x64x8_8x32x1_2x4_4x8_1x2(b using WarpShape = cutlass::gemm::GemmShape<8, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -429,9 +429,9 @@ static void BM_SM50_device_maximum_plus_ssrgemm_tt_t_16x32x8_16x16x1_4x2_4x8_1x2 using WarpShape = cutlass::gemm::GemmShape<16, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using 
AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -479,9 +479,9 @@ static void BM_SM50_device_maximum_plus_ssrgemm_tt_t_16x64x8_16x32x1_4x4_4x8_1x2 using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -529,9 +529,9 @@ static void BM_SM50_device_maximum_plus_ssrgemm_tt_t_16x128x8_16x64x1_4x8_4x8_1x using WarpShape = cutlass::gemm::GemmShape<16, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -579,9 +579,9 @@ static void BM_SM50_device_maximum_plus_ssrgemm_tt_t_32x32x8_32x16x1_4x4_8x4_1x2 using WarpShape = cutlass::gemm::GemmShape<32, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ 
-629,9 +629,9 @@ static void BM_SM50_device_maximum_plus_ssrgemm_tt_t_32x64x8_32x32x1_8x4_4x8_1x2 using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -679,9 +679,9 @@ static void BM_SM50_device_maximum_plus_ssrgemm_tt_t_32x128x8_32x64x1_8x8_4x8_1x using WarpShape = cutlass::gemm::GemmShape<32, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -729,9 +729,9 @@ static void BM_SM50_device_maximum_plus_ssrgemm_tt_t_64x64x8_64x32x1_8x8_8x4_1x2 using WarpShape = cutlass::gemm::GemmShape<64, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -779,9 +779,9 @@ static void 
BM_SM50_device_maximum_plus_ssrgemm_tt_t_32x32x8_16x32x1_4x4_4x8_2x1 using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -829,9 +829,9 @@ static void BM_SM50_device_maximum_plus_ssrgemm_tt_t_64x32x8_32x32x1_8x4_4x8_2x1 using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -879,9 +879,9 @@ static void BM_SM50_device_maximum_plus_ssrgemm_tt_t_64x64x8_32x64x1_8x8_4x8_2x1 using WarpShape = cutlass::gemm::GemmShape<32, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -929,9 +929,9 @@ static void BM_SM50_device_maximum_plus_ssrgemm_tt_t_128x32x8_64x32x1_8x8_8x4_2x using 
WarpShape = cutlass::gemm::GemmShape<64, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -979,9 +979,9 @@ static void BM_SM50_device_maximum_plus_ssrgemm_tt_t_16x32x8_8x16x1_2x2_4x8_2x2( using WarpShape = cutlass::gemm::GemmShape<8, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1029,9 +1029,9 @@ static void BM_SM50_device_maximum_plus_ssrgemm_tt_t_16x64x8_8x32x1_2x4_4x8_2x2( using WarpShape = cutlass::gemm::GemmShape<8, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1079,9 +1079,9 @@ static void BM_SM50_device_maximum_plus_ssrgemm_tt_t_32x32x8_16x16x1_4x2_4x8_2x2 using WarpShape = cutlass::gemm::GemmShape<16, 16, 8>; using InstructionShape = 
cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1129,9 +1129,9 @@ static void BM_SM50_device_maximum_plus_ssrgemm_tt_t_32x64x8_16x32x1_4x4_4x8_2x2 using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1179,9 +1179,9 @@ static void BM_SM50_device_maximum_plus_ssrgemm_tt_t_32x128x8_16x64x1_4x8_4x8_2x using WarpShape = cutlass::gemm::GemmShape<16, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1229,9 +1229,9 @@ static void BM_SM50_device_maximum_plus_ssrgemm_tt_t_64x32x8_32x16x1_4x4_8x4_2x2 using WarpShape = cutlass::gemm::GemmShape<32, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename 
cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1279,9 +1279,9 @@ static void BM_SM50_device_maximum_plus_ssrgemm_tt_t_64x64x8_32x32x1_8x4_4x8_2x2 using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1329,9 +1329,9 @@ static void BM_SM50_device_maximum_plus_ssrgemm_tt_t_64x128x8_32x64x1_8x8_4x8_2x using WarpShape = cutlass::gemm::GemmShape<32, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1379,9 +1379,9 @@ static void BM_SM50_device_maximum_plus_ssrgemm_tt_t_128x32x8_64x16x1_8x4_8x4_2x using WarpShape = cutlass::gemm::GemmShape<64, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, 
precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1429,9 +1429,9 @@ static void BM_SM50_device_maximum_plus_ssrgemm_tt_t_128x64x8_64x32x1_8x8_8x4_2x using WarpShape = cutlass::gemm::GemmShape<64, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1479,9 +1479,9 @@ static void BM_SM50_device_maximum_plus_ssrgemm_tt_t_16x64x16_8x16x1_2x2_4x8_2x4 using WarpShape = cutlass::gemm::GemmShape<8, 16, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1529,9 +1529,9 @@ static void BM_SM50_device_maximum_plus_ssrgemm_tt_t_16x128x16_8x32x1_2x4_4x8_2x using WarpShape = cutlass::gemm::GemmShape<8, 32, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, 
cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1579,9 +1579,9 @@ static void BM_SM50_device_maximum_plus_ssrgemm_tt_t_32x32x8_16x8x1_2x2_8x4_2x4( using WarpShape = cutlass::gemm::GemmShape<16, 8, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1629,9 +1629,9 @@ static void BM_SM50_device_maximum_plus_ssrgemm_tt_t_32x64x8_16x16x1_4x2_4x8_2x4 using WarpShape = cutlass::gemm::GemmShape<16, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1679,9 +1679,9 @@ static void BM_SM50_device_maximum_plus_ssrgemm_tt_t_32x128x8_16x32x1_4x4_4x8_2x using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename 
cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1729,9 +1729,9 @@ static void BM_SM50_device_maximum_plus_ssrgemm_tt_t_32x256x8_16x64x1_4x8_4x8_2x using WarpShape = cutlass::gemm::GemmShape<16, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1779,9 +1779,9 @@ static void BM_SM50_device_maximum_plus_ssrgemm_tt_t_64x64x8_32x16x1_4x4_8x4_2x4 using WarpShape = cutlass::gemm::GemmShape<32, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1829,9 +1829,9 @@ static void BM_SM50_device_maximum_plus_ssrgemm_tt_t_64x128x8_32x32x1_8x4_4x8_2x using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, 
precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1879,9 +1879,9 @@ static void BM_SM50_device_maximum_plus_ssrgemm_tt_t_64x256x8_32x64x1_8x8_4x8_2x using WarpShape = cutlass::gemm::GemmShape<32, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1929,9 +1929,9 @@ static void BM_SM50_device_maximum_plus_ssrgemm_tt_t_128x128x8_64x32x1_8x8_8x4_2 using WarpShape = cutlass::gemm::GemmShape<64, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1979,9 +1979,9 @@ static void BM_SM50_device_maximum_plus_ssrgemm_tt_t_32x32x8_8x16x1_2x2_4x8_4x2( using WarpShape = cutlass::gemm::GemmShape<8, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, 
OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -2029,9 +2029,9 @@ static void BM_SM50_device_maximum_plus_ssrgemm_tt_t_64x32x8_16x16x1_4x2_4x8_4x2 using WarpShape = cutlass::gemm::GemmShape<16, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -2079,9 +2079,9 @@ static void BM_SM50_device_maximum_plus_ssrgemm_tt_t_64x64x8_16x32x1_4x4_4x8_4x2 using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -2129,9 +2129,9 @@ static void BM_SM50_device_maximum_plus_ssrgemm_tt_t_128x32x8_32x16x1_4x4_8x4_4x using WarpShape = cutlass::gemm::GemmShape<32, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = 
Config::MultiplicationOp; @@ -2179,9 +2179,9 @@ static void BM_SM50_device_maximum_plus_ssrgemm_tt_t_128x64x8_32x32x1_8x4_4x8_4x using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -2229,9 +2229,9 @@ static void BM_SM50_device_maximum_plus_ssrgemm_tt_t_128x128x8_32x64x1_8x8_4x8_4 using WarpShape = cutlass::gemm::GemmShape<32, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -2279,9 +2279,9 @@ static void BM_SM50_device_maximum_plus_ssrgemm_tt_t_256x32x8_64x16x1_8x4_8x4_4x using WarpShape = cutlass::gemm::GemmShape<64, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -2329,9 +2329,9 @@ static void 
BM_SM50_device_maximum_plus_ssrgemm_tt_t_256x64x8_64x32x1_8x8_8x4_4x using WarpShape = cutlass::gemm::GemmShape<64, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -2379,9 +2379,9 @@ static void BM_SM50_device_maximum_plus_ssrgemm_tt_t_32x64x16_8x16x1_2x2_4x8_4x4 using WarpShape = cutlass::gemm::GemmShape<8, 16, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -2429,9 +2429,9 @@ static void BM_SM50_device_maximum_plus_ssrgemm_tt_t_32x128x16_8x32x1_2x4_4x8_4x using WarpShape = cutlass::gemm::GemmShape<8, 32, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -2479,9 +2479,9 @@ static void BM_SM50_device_maximum_plus_ssrgemm_tt_t_64x32x16_16x8x1_2x2_8x4_4x4 
using WarpShape = cutlass::gemm::GemmShape<16, 8, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -2529,9 +2529,9 @@ static void BM_SM50_device_maximum_plus_ssrgemm_tt_t_64x64x8_16x16x1_4x2_4x8_4x4 using WarpShape = cutlass::gemm::GemmShape<16, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -2579,9 +2579,9 @@ static void BM_SM50_device_maximum_plus_ssrgemm_tt_t_64x128x8_16x32x1_4x4_4x8_4x using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -2629,9 +2629,9 @@ static void BM_SM50_device_maximum_plus_ssrgemm_tt_t_64x256x8_16x64x1_4x8_4x8_4x using WarpShape = cutlass::gemm::GemmShape<16, 64, 8>; using 
InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -2679,9 +2679,9 @@ static void BM_SM50_device_maximum_plus_ssrgemm_tt_t_128x32x16_32x8x1_4x2_8x4_4x using WarpShape = cutlass::gemm::GemmShape<32, 8, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -2729,9 +2729,9 @@ static void BM_SM50_device_maximum_plus_ssrgemm_tt_t_128x64x8_32x16x1_4x4_8x4_4x using WarpShape = cutlass::gemm::GemmShape<32, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -2779,9 +2779,9 @@ static void BM_SM50_device_maximum_plus_ssrgemm_tt_t_128x128x8_32x32x1_8x4_4x8_4 using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = 
typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -2829,9 +2829,9 @@ static void BM_SM50_device_maximum_plus_ssrgemm_tt_t_256x64x8_64x16x1_8x4_8x4_4x using WarpShape = cutlass::gemm::GemmShape<64, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; diff --git a/bench/device/sm50_simt_minimum_maximum_dsrgemm_nn_n.cu b/bench/device/sm50_simt_minimum_maximum_dsrgemm_nn_n.cu index 070c2c6..7ef087c 100644 --- a/bench/device/sm50_simt_minimum_maximum_dsrgemm_nn_n.cu +++ b/bench/device/sm50_simt_minimum_maximum_dsrgemm_nn_n.cu @@ -29,9 +29,9 @@ static void BM_SM50_device_minimum_maximum_dsrgemm_nn_n_8x32x8_8x32x1_2x4_4x8_1x using WarpShape = cutlass::gemm::GemmShape<8, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -79,9 +79,9 @@ static 
void BM_SM50_device_minimum_maximum_dsrgemm_nn_n_16x32x8_16x32x1_4x4_4x8_ using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -129,9 +129,9 @@ static void BM_SM50_device_minimum_maximum_dsrgemm_nn_n_16x64x8_16x64x1_4x8_4x8_ using WarpShape = cutlass::gemm::GemmShape<16, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -179,9 +179,9 @@ static void BM_SM50_device_minimum_maximum_dsrgemm_nn_n_32x32x8_32x32x1_8x4_4x8_ using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -229,9 +229,9 @@ static void 
BM_SM50_device_minimum_maximum_dsrgemm_nn_n_8x32x8_8x16x1_2x2_4x8_1x using WarpShape = cutlass::gemm::GemmShape<8, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -279,9 +279,9 @@ static void BM_SM50_device_minimum_maximum_dsrgemm_nn_n_8x64x8_8x32x1_2x4_4x8_1x using WarpShape = cutlass::gemm::GemmShape<8, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -329,9 +329,9 @@ static void BM_SM50_device_minimum_maximum_dsrgemm_nn_n_16x32x8_16x16x1_4x2_4x8_ using WarpShape = cutlass::gemm::GemmShape<16, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -379,9 +379,9 @@ static void 
BM_SM50_device_minimum_maximum_dsrgemm_nn_n_16x64x8_16x32x1_4x4_4x8_ using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -429,9 +429,9 @@ static void BM_SM50_device_minimum_maximum_dsrgemm_nn_n_16x128x8_16x64x1_4x8_4x8 using WarpShape = cutlass::gemm::GemmShape<16, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -479,9 +479,9 @@ static void BM_SM50_device_minimum_maximum_dsrgemm_nn_n_32x32x8_32x16x1_4x4_8x4_ using WarpShape = cutlass::gemm::GemmShape<32, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -529,9 +529,9 @@ static void 
BM_SM50_device_minimum_maximum_dsrgemm_nn_n_32x64x8_32x32x1_8x4_4x8_ using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -579,9 +579,9 @@ static void BM_SM50_device_minimum_maximum_dsrgemm_nn_n_32x32x8_16x32x1_4x4_4x8_ using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -629,9 +629,9 @@ static void BM_SM50_device_minimum_maximum_dsrgemm_nn_n_64x32x8_32x32x1_8x4_4x8_ using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -679,9 +679,9 @@ static void 
BM_SM50_device_minimum_maximum_dsrgemm_nn_n_16x32x8_8x16x1_2x2_4x8_2 using WarpShape = cutlass::gemm::GemmShape<8, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -729,9 +729,9 @@ static void BM_SM50_device_minimum_maximum_dsrgemm_nn_n_16x64x8_8x32x1_2x4_4x8_2 using WarpShape = cutlass::gemm::GemmShape<8, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -779,9 +779,9 @@ static void BM_SM50_device_minimum_maximum_dsrgemm_nn_n_32x32x8_16x16x1_4x2_4x8_ using WarpShape = cutlass::gemm::GemmShape<16, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -829,9 +829,9 @@ static void 
BM_SM50_device_minimum_maximum_dsrgemm_nn_n_32x64x8_16x32x1_4x4_4x8_ using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -879,9 +879,9 @@ static void BM_SM50_device_minimum_maximum_dsrgemm_nn_n_32x128x8_16x64x1_4x8_4x8 using WarpShape = cutlass::gemm::GemmShape<16, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -929,9 +929,9 @@ static void BM_SM50_device_minimum_maximum_dsrgemm_nn_n_64x32x8_32x16x1_4x4_8x4_ using WarpShape = cutlass::gemm::GemmShape<32, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -979,9 +979,9 @@ static void 
BM_SM50_device_minimum_maximum_dsrgemm_nn_n_64x64x8_32x32x1_8x4_4x8_ using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1029,9 +1029,9 @@ static void BM_SM50_device_minimum_maximum_dsrgemm_nn_n_128x32x8_64x16x1_8x4_8x4 using WarpShape = cutlass::gemm::GemmShape<64, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1079,9 +1079,9 @@ static void BM_SM50_device_minimum_maximum_dsrgemm_nn_n_16x64x16_8x16x1_2x2_4x8_ using WarpShape = cutlass::gemm::GemmShape<8, 16, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1129,9 +1129,9 @@ static void 
BM_SM50_device_minimum_maximum_dsrgemm_nn_n_16x128x16_8x32x1_2x4_4x8 using WarpShape = cutlass::gemm::GemmShape<8, 32, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1179,9 +1179,9 @@ static void BM_SM50_device_minimum_maximum_dsrgemm_nn_n_32x32x8_16x8x1_2x2_8x4_2 using WarpShape = cutlass::gemm::GemmShape<16, 8, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1229,9 +1229,9 @@ static void BM_SM50_device_minimum_maximum_dsrgemm_nn_n_32x64x8_16x16x1_4x2_4x8_ using WarpShape = cutlass::gemm::GemmShape<16, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1279,9 +1279,9 @@ static void 
BM_SM50_device_minimum_maximum_dsrgemm_nn_n_32x128x8_16x32x1_4x4_4x8 using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1329,9 +1329,9 @@ static void BM_SM50_device_minimum_maximum_dsrgemm_nn_n_64x64x8_32x16x1_4x4_8x4_ using WarpShape = cutlass::gemm::GemmShape<32, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1379,9 +1379,9 @@ static void BM_SM50_device_minimum_maximum_dsrgemm_nn_n_32x32x8_8x16x1_2x2_4x8_4 using WarpShape = cutlass::gemm::GemmShape<8, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1429,9 +1429,9 @@ static void 
BM_SM50_device_minimum_maximum_dsrgemm_nn_n_64x32x8_16x16x1_4x2_4x8_ using WarpShape = cutlass::gemm::GemmShape<16, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1479,9 +1479,9 @@ static void BM_SM50_device_minimum_maximum_dsrgemm_nn_n_64x64x8_16x32x1_4x4_4x8_ using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1529,9 +1529,9 @@ static void BM_SM50_device_minimum_maximum_dsrgemm_nn_n_128x32x8_32x16x1_4x4_8x4 using WarpShape = cutlass::gemm::GemmShape<32, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1579,9 +1579,9 @@ static void 
BM_SM50_device_minimum_maximum_dsrgemm_nn_n_32x64x16_8x16x1_2x2_4x8_ using WarpShape = cutlass::gemm::GemmShape<8, 16, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1629,9 +1629,9 @@ static void BM_SM50_device_minimum_maximum_dsrgemm_nn_n_32x128x16_8x32x1_2x4_4x8 using WarpShape = cutlass::gemm::GemmShape<8, 32, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1679,9 +1679,9 @@ static void BM_SM50_device_minimum_maximum_dsrgemm_nn_n_64x32x16_16x8x1_2x2_8x4_ using WarpShape = cutlass::gemm::GemmShape<16, 8, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1729,9 +1729,9 @@ static void 
BM_SM50_device_minimum_maximum_dsrgemm_nn_n_64x64x8_16x16x1_4x2_4x8_ using WarpShape = cutlass::gemm::GemmShape<16, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1779,9 +1779,9 @@ static void BM_SM50_device_minimum_maximum_dsrgemm_nn_n_128x32x16_32x8x1_4x2_8x4 using WarpShape = cutlass::gemm::GemmShape<32, 8, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; diff --git a/bench/device/sm50_simt_minimum_maximum_dsrgemm_nn_t.cu b/bench/device/sm50_simt_minimum_maximum_dsrgemm_nn_t.cu index e6d2239..b3452c3 100644 --- a/bench/device/sm50_simt_minimum_maximum_dsrgemm_nn_t.cu +++ b/bench/device/sm50_simt_minimum_maximum_dsrgemm_nn_t.cu @@ -29,9 +29,9 @@ static void BM_SM50_device_minimum_maximum_dsrgemm_nn_t_8x32x8_8x32x1_2x4_4x8_1x using WarpShape = cutlass::gemm::GemmShape<8, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename 
cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -79,9 +79,9 @@ static void BM_SM50_device_minimum_maximum_dsrgemm_nn_t_16x32x8_16x32x1_4x4_4x8_ using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -129,9 +129,9 @@ static void BM_SM50_device_minimum_maximum_dsrgemm_nn_t_16x64x8_16x64x1_4x8_4x8_ using WarpShape = cutlass::gemm::GemmShape<16, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -179,9 +179,9 @@ static void BM_SM50_device_minimum_maximum_dsrgemm_nn_t_32x32x8_32x32x1_8x4_4x8_ using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + 
precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -229,9 +229,9 @@ static void BM_SM50_device_minimum_maximum_dsrgemm_nn_t_8x32x8_8x16x1_2x2_4x8_1x using WarpShape = cutlass::gemm::GemmShape<8, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -279,9 +279,9 @@ static void BM_SM50_device_minimum_maximum_dsrgemm_nn_t_8x64x8_8x32x1_2x4_4x8_1x using WarpShape = cutlass::gemm::GemmShape<8, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -329,9 +329,9 @@ static void BM_SM50_device_minimum_maximum_dsrgemm_nn_t_16x32x8_16x16x1_4x2_4x8_ using WarpShape = cutlass::gemm::GemmShape<16, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + 
cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -379,9 +379,9 @@ static void BM_SM50_device_minimum_maximum_dsrgemm_nn_t_16x64x8_16x32x1_4x4_4x8_ using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -429,9 +429,9 @@ static void BM_SM50_device_minimum_maximum_dsrgemm_nn_t_16x128x8_16x64x1_4x8_4x8 using WarpShape = cutlass::gemm::GemmShape<16, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -479,9 +479,9 @@ static void BM_SM50_device_minimum_maximum_dsrgemm_nn_t_32x32x8_32x16x1_4x4_8x4_ using WarpShape = cutlass::gemm::GemmShape<32, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using 
AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -529,9 +529,9 @@ static void BM_SM50_device_minimum_maximum_dsrgemm_nn_t_32x64x8_32x32x1_8x4_4x8_ using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -579,9 +579,9 @@ static void BM_SM50_device_minimum_maximum_dsrgemm_nn_t_32x32x8_16x32x1_4x4_4x8_ using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -629,9 +629,9 @@ static void BM_SM50_device_minimum_maximum_dsrgemm_nn_t_64x32x8_32x32x1_8x4_4x8_ using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = 
Config::MultiplicationOp; @@ -679,9 +679,9 @@ static void BM_SM50_device_minimum_maximum_dsrgemm_nn_t_16x32x8_8x16x1_2x2_4x8_2 using WarpShape = cutlass::gemm::GemmShape<8, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -729,9 +729,9 @@ static void BM_SM50_device_minimum_maximum_dsrgemm_nn_t_16x64x8_8x32x1_2x4_4x8_2 using WarpShape = cutlass::gemm::GemmShape<8, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -779,9 +779,9 @@ static void BM_SM50_device_minimum_maximum_dsrgemm_nn_t_32x32x8_16x16x1_4x2_4x8_ using WarpShape = cutlass::gemm::GemmShape<16, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -829,9 +829,9 @@ static void 
BM_SM50_device_minimum_maximum_dsrgemm_nn_t_32x64x8_16x32x1_4x4_4x8_ using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -879,9 +879,9 @@ static void BM_SM50_device_minimum_maximum_dsrgemm_nn_t_32x128x8_16x64x1_4x8_4x8 using WarpShape = cutlass::gemm::GemmShape<16, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -929,9 +929,9 @@ static void BM_SM50_device_minimum_maximum_dsrgemm_nn_t_64x32x8_32x16x1_4x4_8x4_ using WarpShape = cutlass::gemm::GemmShape<32, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -979,9 +979,9 @@ static void 
BM_SM50_device_minimum_maximum_dsrgemm_nn_t_64x64x8_32x32x1_8x4_4x8_ using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1029,9 +1029,9 @@ static void BM_SM50_device_minimum_maximum_dsrgemm_nn_t_128x32x8_64x16x1_8x4_8x4 using WarpShape = cutlass::gemm::GemmShape<64, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1079,9 +1079,9 @@ static void BM_SM50_device_minimum_maximum_dsrgemm_nn_t_16x64x16_8x16x1_2x2_4x8_ using WarpShape = cutlass::gemm::GemmShape<8, 16, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1129,9 +1129,9 @@ static void 
BM_SM50_device_minimum_maximum_dsrgemm_nn_t_16x128x16_8x32x1_2x4_4x8 using WarpShape = cutlass::gemm::GemmShape<8, 32, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1179,9 +1179,9 @@ static void BM_SM50_device_minimum_maximum_dsrgemm_nn_t_32x32x8_16x8x1_2x2_8x4_2 using WarpShape = cutlass::gemm::GemmShape<16, 8, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1229,9 +1229,9 @@ static void BM_SM50_device_minimum_maximum_dsrgemm_nn_t_32x64x8_16x16x1_4x2_4x8_ using WarpShape = cutlass::gemm::GemmShape<16, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1279,9 +1279,9 @@ static void 
BM_SM50_device_minimum_maximum_dsrgemm_nn_t_32x128x8_16x32x1_4x4_4x8 using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1329,9 +1329,9 @@ static void BM_SM50_device_minimum_maximum_dsrgemm_nn_t_64x64x8_32x16x1_4x4_8x4_ using WarpShape = cutlass::gemm::GemmShape<32, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1379,9 +1379,9 @@ static void BM_SM50_device_minimum_maximum_dsrgemm_nn_t_32x32x8_8x16x1_2x2_4x8_4 using WarpShape = cutlass::gemm::GemmShape<8, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1429,9 +1429,9 @@ static void 
BM_SM50_device_minimum_maximum_dsrgemm_nn_t_64x32x8_16x16x1_4x2_4x8_ using WarpShape = cutlass::gemm::GemmShape<16, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1479,9 +1479,9 @@ static void BM_SM50_device_minimum_maximum_dsrgemm_nn_t_64x64x8_16x32x1_4x4_4x8_ using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1529,9 +1529,9 @@ static void BM_SM50_device_minimum_maximum_dsrgemm_nn_t_128x32x8_32x16x1_4x4_8x4 using WarpShape = cutlass::gemm::GemmShape<32, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1579,9 +1579,9 @@ static void 
BM_SM50_device_minimum_maximum_dsrgemm_nn_t_32x64x16_8x16x1_2x2_4x8_ using WarpShape = cutlass::gemm::GemmShape<8, 16, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1629,9 +1629,9 @@ static void BM_SM50_device_minimum_maximum_dsrgemm_nn_t_32x128x16_8x32x1_2x4_4x8 using WarpShape = cutlass::gemm::GemmShape<8, 32, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1679,9 +1679,9 @@ static void BM_SM50_device_minimum_maximum_dsrgemm_nn_t_64x32x16_16x8x1_2x2_8x4_ using WarpShape = cutlass::gemm::GemmShape<16, 8, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1729,9 +1729,9 @@ static void 
BM_SM50_device_minimum_maximum_dsrgemm_nn_t_64x64x8_16x16x1_4x2_4x8_ using WarpShape = cutlass::gemm::GemmShape<16, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1779,9 +1779,9 @@ static void BM_SM50_device_minimum_maximum_dsrgemm_nn_t_128x32x16_32x8x1_4x2_8x4 using WarpShape = cutlass::gemm::GemmShape<32, 8, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; diff --git a/bench/device/sm50_simt_minimum_maximum_dsrgemm_nt_n.cu b/bench/device/sm50_simt_minimum_maximum_dsrgemm_nt_n.cu index 5412493..57306bf 100644 --- a/bench/device/sm50_simt_minimum_maximum_dsrgemm_nt_n.cu +++ b/bench/device/sm50_simt_minimum_maximum_dsrgemm_nt_n.cu @@ -29,9 +29,9 @@ static void BM_SM50_device_minimum_maximum_dsrgemm_nt_n_8x32x8_8x32x1_2x4_4x8_1x using WarpShape = cutlass::gemm::GemmShape<8, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename 
cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -79,9 +79,9 @@ static void BM_SM50_device_minimum_maximum_dsrgemm_nt_n_16x32x8_16x32x1_4x4_4x8_ using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -129,9 +129,9 @@ static void BM_SM50_device_minimum_maximum_dsrgemm_nt_n_16x64x8_16x64x1_4x8_4x8_ using WarpShape = cutlass::gemm::GemmShape<16, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -179,9 +179,9 @@ static void BM_SM50_device_minimum_maximum_dsrgemm_nt_n_32x32x8_32x32x1_8x4_4x8_ using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + 
precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -229,9 +229,9 @@ static void BM_SM50_device_minimum_maximum_dsrgemm_nt_n_8x32x8_8x16x1_2x2_4x8_1x using WarpShape = cutlass::gemm::GemmShape<8, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -279,9 +279,9 @@ static void BM_SM50_device_minimum_maximum_dsrgemm_nt_n_8x64x8_8x32x1_2x4_4x8_1x using WarpShape = cutlass::gemm::GemmShape<8, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -329,9 +329,9 @@ static void BM_SM50_device_minimum_maximum_dsrgemm_nt_n_16x32x8_16x16x1_4x2_4x8_ using WarpShape = cutlass::gemm::GemmShape<16, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + 
cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -379,9 +379,9 @@ static void BM_SM50_device_minimum_maximum_dsrgemm_nt_n_16x64x8_16x32x1_4x4_4x8_ using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -429,9 +429,9 @@ static void BM_SM50_device_minimum_maximum_dsrgemm_nt_n_16x128x8_16x64x1_4x8_4x8 using WarpShape = cutlass::gemm::GemmShape<16, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -479,9 +479,9 @@ static void BM_SM50_device_minimum_maximum_dsrgemm_nt_n_32x32x8_32x16x1_4x4_8x4_ using WarpShape = cutlass::gemm::GemmShape<32, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using 
AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -529,9 +529,9 @@ static void BM_SM50_device_minimum_maximum_dsrgemm_nt_n_32x64x8_32x32x1_8x4_4x8_ using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -579,9 +579,9 @@ static void BM_SM50_device_minimum_maximum_dsrgemm_nt_n_32x32x8_16x32x1_4x4_4x8_ using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -629,9 +629,9 @@ static void BM_SM50_device_minimum_maximum_dsrgemm_nt_n_64x32x8_32x32x1_8x4_4x8_ using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = 
Config::MultiplicationOp; @@ -679,9 +679,9 @@ static void BM_SM50_device_minimum_maximum_dsrgemm_nt_n_16x32x8_8x16x1_2x2_4x8_2 using WarpShape = cutlass::gemm::GemmShape<8, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -729,9 +729,9 @@ static void BM_SM50_device_minimum_maximum_dsrgemm_nt_n_16x64x8_8x32x1_2x4_4x8_2 using WarpShape = cutlass::gemm::GemmShape<8, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -779,9 +779,9 @@ static void BM_SM50_device_minimum_maximum_dsrgemm_nt_n_32x32x8_16x16x1_4x2_4x8_ using WarpShape = cutlass::gemm::GemmShape<16, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -829,9 +829,9 @@ static void 
BM_SM50_device_minimum_maximum_dsrgemm_nt_n_32x64x8_16x32x1_4x4_4x8_ using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -879,9 +879,9 @@ static void BM_SM50_device_minimum_maximum_dsrgemm_nt_n_32x128x8_16x64x1_4x8_4x8 using WarpShape = cutlass::gemm::GemmShape<16, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -929,9 +929,9 @@ static void BM_SM50_device_minimum_maximum_dsrgemm_nt_n_64x32x8_32x16x1_4x4_8x4_ using WarpShape = cutlass::gemm::GemmShape<32, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -979,9 +979,9 @@ static void 
BM_SM50_device_minimum_maximum_dsrgemm_nt_n_64x64x8_32x32x1_8x4_4x8_ using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1029,9 +1029,9 @@ static void BM_SM50_device_minimum_maximum_dsrgemm_nt_n_128x32x8_64x16x1_8x4_8x4 using WarpShape = cutlass::gemm::GemmShape<64, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1079,9 +1079,9 @@ static void BM_SM50_device_minimum_maximum_dsrgemm_nt_n_16x64x16_8x16x1_2x2_4x8_ using WarpShape = cutlass::gemm::GemmShape<8, 16, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1129,9 +1129,9 @@ static void 
BM_SM50_device_minimum_maximum_dsrgemm_nt_n_16x128x16_8x32x1_2x4_4x8 using WarpShape = cutlass::gemm::GemmShape<8, 32, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1179,9 +1179,9 @@ static void BM_SM50_device_minimum_maximum_dsrgemm_nt_n_32x32x8_16x8x1_2x2_8x4_2 using WarpShape = cutlass::gemm::GemmShape<16, 8, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1229,9 +1229,9 @@ static void BM_SM50_device_minimum_maximum_dsrgemm_nt_n_32x64x8_16x16x1_4x2_4x8_ using WarpShape = cutlass::gemm::GemmShape<16, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1279,9 +1279,9 @@ static void 
BM_SM50_device_minimum_maximum_dsrgemm_nt_n_32x128x8_16x32x1_4x4_4x8 using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1329,9 +1329,9 @@ static void BM_SM50_device_minimum_maximum_dsrgemm_nt_n_64x64x8_32x16x1_4x4_8x4_ using WarpShape = cutlass::gemm::GemmShape<32, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1379,9 +1379,9 @@ static void BM_SM50_device_minimum_maximum_dsrgemm_nt_n_32x32x8_8x16x1_2x2_4x8_4 using WarpShape = cutlass::gemm::GemmShape<8, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1429,9 +1429,9 @@ static void 
BM_SM50_device_minimum_maximum_dsrgemm_nt_n_64x32x8_16x16x1_4x2_4x8_ using WarpShape = cutlass::gemm::GemmShape<16, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1479,9 +1479,9 @@ static void BM_SM50_device_minimum_maximum_dsrgemm_nt_n_64x64x8_16x32x1_4x4_4x8_ using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1529,9 +1529,9 @@ static void BM_SM50_device_minimum_maximum_dsrgemm_nt_n_128x32x8_32x16x1_4x4_8x4 using WarpShape = cutlass::gemm::GemmShape<32, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1579,9 +1579,9 @@ static void 
BM_SM50_device_minimum_maximum_dsrgemm_nt_n_32x64x16_8x16x1_2x2_4x8_ using WarpShape = cutlass::gemm::GemmShape<8, 16, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1629,9 +1629,9 @@ static void BM_SM50_device_minimum_maximum_dsrgemm_nt_n_32x128x16_8x32x1_2x4_4x8 using WarpShape = cutlass::gemm::GemmShape<8, 32, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1679,9 +1679,9 @@ static void BM_SM50_device_minimum_maximum_dsrgemm_nt_n_64x32x16_16x8x1_2x2_8x4_ using WarpShape = cutlass::gemm::GemmShape<16, 8, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1729,9 +1729,9 @@ static void 
BM_SM50_device_minimum_maximum_dsrgemm_nt_n_64x64x8_16x16x1_4x2_4x8_ using WarpShape = cutlass::gemm::GemmShape<16, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1779,9 +1779,9 @@ static void BM_SM50_device_minimum_maximum_dsrgemm_nt_n_128x32x16_32x8x1_4x2_8x4 using WarpShape = cutlass::gemm::GemmShape<32, 8, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; diff --git a/bench/device/sm50_simt_minimum_maximum_dsrgemm_nt_t.cu b/bench/device/sm50_simt_minimum_maximum_dsrgemm_nt_t.cu index c537d86..66c04f4 100644 --- a/bench/device/sm50_simt_minimum_maximum_dsrgemm_nt_t.cu +++ b/bench/device/sm50_simt_minimum_maximum_dsrgemm_nt_t.cu @@ -29,9 +29,9 @@ static void BM_SM50_device_minimum_maximum_dsrgemm_nt_t_8x32x8_8x32x1_2x4_4x8_1x using WarpShape = cutlass::gemm::GemmShape<8, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename 
cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -79,9 +79,9 @@ static void BM_SM50_device_minimum_maximum_dsrgemm_nt_t_16x32x8_16x32x1_4x4_4x8_ using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -129,9 +129,9 @@ static void BM_SM50_device_minimum_maximum_dsrgemm_nt_t_16x64x8_16x64x1_4x8_4x8_ using WarpShape = cutlass::gemm::GemmShape<16, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -179,9 +179,9 @@ static void BM_SM50_device_minimum_maximum_dsrgemm_nt_t_32x32x8_32x32x1_8x4_4x8_ using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + 
precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -229,9 +229,9 @@ static void BM_SM50_device_minimum_maximum_dsrgemm_nt_t_8x32x8_8x16x1_2x2_4x8_1x using WarpShape = cutlass::gemm::GemmShape<8, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -279,9 +279,9 @@ static void BM_SM50_device_minimum_maximum_dsrgemm_nt_t_8x64x8_8x32x1_2x4_4x8_1x using WarpShape = cutlass::gemm::GemmShape<8, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -329,9 +329,9 @@ static void BM_SM50_device_minimum_maximum_dsrgemm_nt_t_16x32x8_16x16x1_4x2_4x8_ using WarpShape = cutlass::gemm::GemmShape<16, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + 
cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -379,9 +379,9 @@ static void BM_SM50_device_minimum_maximum_dsrgemm_nt_t_16x64x8_16x32x1_4x4_4x8_ using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -429,9 +429,9 @@ static void BM_SM50_device_minimum_maximum_dsrgemm_nt_t_16x128x8_16x64x1_4x8_4x8 using WarpShape = cutlass::gemm::GemmShape<16, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -479,9 +479,9 @@ static void BM_SM50_device_minimum_maximum_dsrgemm_nt_t_32x32x8_32x16x1_4x4_8x4_ using WarpShape = cutlass::gemm::GemmShape<32, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using 
AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -529,9 +529,9 @@ static void BM_SM50_device_minimum_maximum_dsrgemm_nt_t_32x64x8_32x32x1_8x4_4x8_ using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -579,9 +579,9 @@ static void BM_SM50_device_minimum_maximum_dsrgemm_nt_t_32x32x8_16x32x1_4x4_4x8_ using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -629,9 +629,9 @@ static void BM_SM50_device_minimum_maximum_dsrgemm_nt_t_64x32x8_32x32x1_8x4_4x8_ using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = 
Config::MultiplicationOp; @@ -679,9 +679,9 @@ static void BM_SM50_device_minimum_maximum_dsrgemm_nt_t_16x32x8_8x16x1_2x2_4x8_2 using WarpShape = cutlass::gemm::GemmShape<8, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -729,9 +729,9 @@ static void BM_SM50_device_minimum_maximum_dsrgemm_nt_t_16x64x8_8x32x1_2x4_4x8_2 using WarpShape = cutlass::gemm::GemmShape<8, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -779,9 +779,9 @@ static void BM_SM50_device_minimum_maximum_dsrgemm_nt_t_32x32x8_16x16x1_4x2_4x8_ using WarpShape = cutlass::gemm::GemmShape<16, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -829,9 +829,9 @@ static void 
BM_SM50_device_minimum_maximum_dsrgemm_nt_t_32x64x8_16x32x1_4x4_4x8_ using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -879,9 +879,9 @@ static void BM_SM50_device_minimum_maximum_dsrgemm_nt_t_32x128x8_16x64x1_4x8_4x8 using WarpShape = cutlass::gemm::GemmShape<16, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -929,9 +929,9 @@ static void BM_SM50_device_minimum_maximum_dsrgemm_nt_t_64x32x8_32x16x1_4x4_8x4_ using WarpShape = cutlass::gemm::GemmShape<32, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -979,9 +979,9 @@ static void 
BM_SM50_device_minimum_maximum_dsrgemm_nt_t_64x64x8_32x32x1_8x4_4x8_ using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1029,9 +1029,9 @@ static void BM_SM50_device_minimum_maximum_dsrgemm_nt_t_128x32x8_64x16x1_8x4_8x4 using WarpShape = cutlass::gemm::GemmShape<64, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1079,9 +1079,9 @@ static void BM_SM50_device_minimum_maximum_dsrgemm_nt_t_16x64x16_8x16x1_2x2_4x8_ using WarpShape = cutlass::gemm::GemmShape<8, 16, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1129,9 +1129,9 @@ static void 
BM_SM50_device_minimum_maximum_dsrgemm_nt_t_16x128x16_8x32x1_2x4_4x8 using WarpShape = cutlass::gemm::GemmShape<8, 32, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1179,9 +1179,9 @@ static void BM_SM50_device_minimum_maximum_dsrgemm_nt_t_32x32x8_16x8x1_2x2_8x4_2 using WarpShape = cutlass::gemm::GemmShape<16, 8, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1229,9 +1229,9 @@ static void BM_SM50_device_minimum_maximum_dsrgemm_nt_t_32x64x8_16x16x1_4x2_4x8_ using WarpShape = cutlass::gemm::GemmShape<16, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1279,9 +1279,9 @@ static void 
BM_SM50_device_minimum_maximum_dsrgemm_nt_t_32x128x8_16x32x1_4x4_4x8 using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1329,9 +1329,9 @@ static void BM_SM50_device_minimum_maximum_dsrgemm_nt_t_64x64x8_32x16x1_4x4_8x4_ using WarpShape = cutlass::gemm::GemmShape<32, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1379,9 +1379,9 @@ static void BM_SM50_device_minimum_maximum_dsrgemm_nt_t_32x32x8_8x16x1_2x2_4x8_4 using WarpShape = cutlass::gemm::GemmShape<8, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1429,9 +1429,9 @@ static void 
BM_SM50_device_minimum_maximum_dsrgemm_nt_t_64x32x8_16x16x1_4x2_4x8_ using WarpShape = cutlass::gemm::GemmShape<16, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1479,9 +1479,9 @@ static void BM_SM50_device_minimum_maximum_dsrgemm_nt_t_64x64x8_16x32x1_4x4_4x8_ using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1529,9 +1529,9 @@ static void BM_SM50_device_minimum_maximum_dsrgemm_nt_t_128x32x8_32x16x1_4x4_8x4 using WarpShape = cutlass::gemm::GemmShape<32, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1579,9 +1579,9 @@ static void 
BM_SM50_device_minimum_maximum_dsrgemm_nt_t_32x64x16_8x16x1_2x2_4x8_ using WarpShape = cutlass::gemm::GemmShape<8, 16, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1629,9 +1629,9 @@ static void BM_SM50_device_minimum_maximum_dsrgemm_nt_t_32x128x16_8x32x1_2x4_4x8 using WarpShape = cutlass::gemm::GemmShape<8, 32, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1679,9 +1679,9 @@ static void BM_SM50_device_minimum_maximum_dsrgemm_nt_t_64x32x16_16x8x1_2x2_8x4_ using WarpShape = cutlass::gemm::GemmShape<16, 8, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1729,9 +1729,9 @@ static void 
BM_SM50_device_minimum_maximum_dsrgemm_nt_t_64x64x8_16x16x1_4x2_4x8_ using WarpShape = cutlass::gemm::GemmShape<16, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1779,9 +1779,9 @@ static void BM_SM50_device_minimum_maximum_dsrgemm_nt_t_128x32x16_32x8x1_4x2_8x4 using WarpShape = cutlass::gemm::GemmShape<32, 8, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; diff --git a/bench/device/sm50_simt_minimum_maximum_dsrgemm_tn_n.cu b/bench/device/sm50_simt_minimum_maximum_dsrgemm_tn_n.cu index 1b98cb3..30f028d 100644 --- a/bench/device/sm50_simt_minimum_maximum_dsrgemm_tn_n.cu +++ b/bench/device/sm50_simt_minimum_maximum_dsrgemm_tn_n.cu @@ -29,9 +29,9 @@ static void BM_SM50_device_minimum_maximum_dsrgemm_tn_n_8x32x8_8x32x1_2x4_4x8_1x using WarpShape = cutlass::gemm::GemmShape<8, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename 
cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -79,9 +79,9 @@ static void BM_SM50_device_minimum_maximum_dsrgemm_tn_n_16x32x8_16x32x1_4x4_4x8_ using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -129,9 +129,9 @@ static void BM_SM50_device_minimum_maximum_dsrgemm_tn_n_16x64x8_16x64x1_4x8_4x8_ using WarpShape = cutlass::gemm::GemmShape<16, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -179,9 +179,9 @@ static void BM_SM50_device_minimum_maximum_dsrgemm_tn_n_32x32x8_32x32x1_8x4_4x8_ using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + 
precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -229,9 +229,9 @@ static void BM_SM50_device_minimum_maximum_dsrgemm_tn_n_8x32x8_8x16x1_2x2_4x8_1x using WarpShape = cutlass::gemm::GemmShape<8, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -279,9 +279,9 @@ static void BM_SM50_device_minimum_maximum_dsrgemm_tn_n_8x64x8_8x32x1_2x4_4x8_1x using WarpShape = cutlass::gemm::GemmShape<8, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -329,9 +329,9 @@ static void BM_SM50_device_minimum_maximum_dsrgemm_tn_n_16x32x8_16x16x1_4x2_4x8_ using WarpShape = cutlass::gemm::GemmShape<16, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + 
cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -379,9 +379,9 @@ static void BM_SM50_device_minimum_maximum_dsrgemm_tn_n_16x64x8_16x32x1_4x4_4x8_ using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -429,9 +429,9 @@ static void BM_SM50_device_minimum_maximum_dsrgemm_tn_n_16x128x8_16x64x1_4x8_4x8 using WarpShape = cutlass::gemm::GemmShape<16, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -479,9 +479,9 @@ static void BM_SM50_device_minimum_maximum_dsrgemm_tn_n_32x32x8_32x16x1_4x4_8x4_ using WarpShape = cutlass::gemm::GemmShape<32, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using 
AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -529,9 +529,9 @@ static void BM_SM50_device_minimum_maximum_dsrgemm_tn_n_32x64x8_32x32x1_8x4_4x8_ using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -579,9 +579,9 @@ static void BM_SM50_device_minimum_maximum_dsrgemm_tn_n_32x32x8_16x32x1_4x4_4x8_ using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -629,9 +629,9 @@ static void BM_SM50_device_minimum_maximum_dsrgemm_tn_n_64x32x8_32x32x1_8x4_4x8_ using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = 
Config::MultiplicationOp; @@ -679,9 +679,9 @@ static void BM_SM50_device_minimum_maximum_dsrgemm_tn_n_16x32x8_8x16x1_2x2_4x8_2 using WarpShape = cutlass::gemm::GemmShape<8, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -729,9 +729,9 @@ static void BM_SM50_device_minimum_maximum_dsrgemm_tn_n_16x64x8_8x32x1_2x4_4x8_2 using WarpShape = cutlass::gemm::GemmShape<8, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -779,9 +779,9 @@ static void BM_SM50_device_minimum_maximum_dsrgemm_tn_n_32x32x8_16x16x1_4x2_4x8_ using WarpShape = cutlass::gemm::GemmShape<16, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -829,9 +829,9 @@ static void 
BM_SM50_device_minimum_maximum_dsrgemm_tn_n_32x64x8_16x32x1_4x4_4x8_ using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -879,9 +879,9 @@ static void BM_SM50_device_minimum_maximum_dsrgemm_tn_n_32x128x8_16x64x1_4x8_4x8 using WarpShape = cutlass::gemm::GemmShape<16, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -929,9 +929,9 @@ static void BM_SM50_device_minimum_maximum_dsrgemm_tn_n_64x32x8_32x16x1_4x4_8x4_ using WarpShape = cutlass::gemm::GemmShape<32, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -979,9 +979,9 @@ static void 
BM_SM50_device_minimum_maximum_dsrgemm_tn_n_64x64x8_32x32x1_8x4_4x8_ using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1029,9 +1029,9 @@ static void BM_SM50_device_minimum_maximum_dsrgemm_tn_n_128x32x8_64x16x1_8x4_8x4 using WarpShape = cutlass::gemm::GemmShape<64, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1079,9 +1079,9 @@ static void BM_SM50_device_minimum_maximum_dsrgemm_tn_n_16x64x16_8x16x1_2x2_4x8_ using WarpShape = cutlass::gemm::GemmShape<8, 16, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1129,9 +1129,9 @@ static void 
BM_SM50_device_minimum_maximum_dsrgemm_tn_n_16x128x16_8x32x1_2x4_4x8 using WarpShape = cutlass::gemm::GemmShape<8, 32, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1179,9 +1179,9 @@ static void BM_SM50_device_minimum_maximum_dsrgemm_tn_n_32x32x8_16x8x1_2x2_8x4_2 using WarpShape = cutlass::gemm::GemmShape<16, 8, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1229,9 +1229,9 @@ static void BM_SM50_device_minimum_maximum_dsrgemm_tn_n_32x64x8_16x16x1_4x2_4x8_ using WarpShape = cutlass::gemm::GemmShape<16, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1279,9 +1279,9 @@ static void 
BM_SM50_device_minimum_maximum_dsrgemm_tn_n_32x128x8_16x32x1_4x4_4x8 using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1329,9 +1329,9 @@ static void BM_SM50_device_minimum_maximum_dsrgemm_tn_n_64x64x8_32x16x1_4x4_8x4_ using WarpShape = cutlass::gemm::GemmShape<32, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1379,9 +1379,9 @@ static void BM_SM50_device_minimum_maximum_dsrgemm_tn_n_32x32x8_8x16x1_2x2_4x8_4 using WarpShape = cutlass::gemm::GemmShape<8, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1429,9 +1429,9 @@ static void 
BM_SM50_device_minimum_maximum_dsrgemm_tn_n_64x32x8_16x16x1_4x2_4x8_ using WarpShape = cutlass::gemm::GemmShape<16, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1479,9 +1479,9 @@ static void BM_SM50_device_minimum_maximum_dsrgemm_tn_n_64x64x8_16x32x1_4x4_4x8_ using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1529,9 +1529,9 @@ static void BM_SM50_device_minimum_maximum_dsrgemm_tn_n_128x32x8_32x16x1_4x4_8x4 using WarpShape = cutlass::gemm::GemmShape<32, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1579,9 +1579,9 @@ static void 
BM_SM50_device_minimum_maximum_dsrgemm_tn_n_32x64x16_8x16x1_2x2_4x8_ using WarpShape = cutlass::gemm::GemmShape<8, 16, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1629,9 +1629,9 @@ static void BM_SM50_device_minimum_maximum_dsrgemm_tn_n_32x128x16_8x32x1_2x4_4x8 using WarpShape = cutlass::gemm::GemmShape<8, 32, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1679,9 +1679,9 @@ static void BM_SM50_device_minimum_maximum_dsrgemm_tn_n_64x32x16_16x8x1_2x2_8x4_ using WarpShape = cutlass::gemm::GemmShape<16, 8, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1729,9 +1729,9 @@ static void 
BM_SM50_device_minimum_maximum_dsrgemm_tn_n_64x64x8_16x16x1_4x2_4x8_ using WarpShape = cutlass::gemm::GemmShape<16, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1779,9 +1779,9 @@ static void BM_SM50_device_minimum_maximum_dsrgemm_tn_n_128x32x16_32x8x1_4x2_8x4 using WarpShape = cutlass::gemm::GemmShape<32, 8, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; diff --git a/bench/device/sm50_simt_minimum_maximum_dsrgemm_tn_t.cu b/bench/device/sm50_simt_minimum_maximum_dsrgemm_tn_t.cu index 136e5b0..cfdf07e 100644 --- a/bench/device/sm50_simt_minimum_maximum_dsrgemm_tn_t.cu +++ b/bench/device/sm50_simt_minimum_maximum_dsrgemm_tn_t.cu @@ -29,9 +29,9 @@ static void BM_SM50_device_minimum_maximum_dsrgemm_tn_t_8x32x8_8x32x1_2x4_4x8_1x using WarpShape = cutlass::gemm::GemmShape<8, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename 
cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -79,9 +79,9 @@ static void BM_SM50_device_minimum_maximum_dsrgemm_tn_t_16x32x8_16x32x1_4x4_4x8_ using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -129,9 +129,9 @@ static void BM_SM50_device_minimum_maximum_dsrgemm_tn_t_16x64x8_16x64x1_4x8_4x8_ using WarpShape = cutlass::gemm::GemmShape<16, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -179,9 +179,9 @@ static void BM_SM50_device_minimum_maximum_dsrgemm_tn_t_32x32x8_32x32x1_8x4_4x8_ using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + 
precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -229,9 +229,9 @@ static void BM_SM50_device_minimum_maximum_dsrgemm_tn_t_8x32x8_8x16x1_2x2_4x8_1x using WarpShape = cutlass::gemm::GemmShape<8, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -279,9 +279,9 @@ static void BM_SM50_device_minimum_maximum_dsrgemm_tn_t_8x64x8_8x32x1_2x4_4x8_1x using WarpShape = cutlass::gemm::GemmShape<8, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -329,9 +329,9 @@ static void BM_SM50_device_minimum_maximum_dsrgemm_tn_t_16x32x8_16x16x1_4x2_4x8_ using WarpShape = cutlass::gemm::GemmShape<16, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + 
cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -379,9 +379,9 @@ static void BM_SM50_device_minimum_maximum_dsrgemm_tn_t_16x64x8_16x32x1_4x4_4x8_ using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -429,9 +429,9 @@ static void BM_SM50_device_minimum_maximum_dsrgemm_tn_t_16x128x8_16x64x1_4x8_4x8 using WarpShape = cutlass::gemm::GemmShape<16, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -479,9 +479,9 @@ static void BM_SM50_device_minimum_maximum_dsrgemm_tn_t_32x32x8_32x16x1_4x4_8x4_ using WarpShape = cutlass::gemm::GemmShape<32, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using 
AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -529,9 +529,9 @@ static void BM_SM50_device_minimum_maximum_dsrgemm_tn_t_32x64x8_32x32x1_8x4_4x8_ using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -579,9 +579,9 @@ static void BM_SM50_device_minimum_maximum_dsrgemm_tn_t_32x32x8_16x32x1_4x4_4x8_ using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -629,9 +629,9 @@ static void BM_SM50_device_minimum_maximum_dsrgemm_tn_t_64x32x8_32x32x1_8x4_4x8_ using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = 
Config::MultiplicationOp; @@ -679,9 +679,9 @@ static void BM_SM50_device_minimum_maximum_dsrgemm_tn_t_16x32x8_8x16x1_2x2_4x8_2 using WarpShape = cutlass::gemm::GemmShape<8, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -729,9 +729,9 @@ static void BM_SM50_device_minimum_maximum_dsrgemm_tn_t_16x64x8_8x32x1_2x4_4x8_2 using WarpShape = cutlass::gemm::GemmShape<8, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -779,9 +779,9 @@ static void BM_SM50_device_minimum_maximum_dsrgemm_tn_t_32x32x8_16x16x1_4x2_4x8_ using WarpShape = cutlass::gemm::GemmShape<16, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -829,9 +829,9 @@ static void 
BM_SM50_device_minimum_maximum_dsrgemm_tn_t_32x64x8_16x32x1_4x4_4x8_ using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -879,9 +879,9 @@ static void BM_SM50_device_minimum_maximum_dsrgemm_tn_t_32x128x8_16x64x1_4x8_4x8 using WarpShape = cutlass::gemm::GemmShape<16, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -929,9 +929,9 @@ static void BM_SM50_device_minimum_maximum_dsrgemm_tn_t_64x32x8_32x16x1_4x4_8x4_ using WarpShape = cutlass::gemm::GemmShape<32, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -979,9 +979,9 @@ static void 
BM_SM50_device_minimum_maximum_dsrgemm_tn_t_64x64x8_32x32x1_8x4_4x8_ using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1029,9 +1029,9 @@ static void BM_SM50_device_minimum_maximum_dsrgemm_tn_t_128x32x8_64x16x1_8x4_8x4 using WarpShape = cutlass::gemm::GemmShape<64, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1079,9 +1079,9 @@ static void BM_SM50_device_minimum_maximum_dsrgemm_tn_t_16x64x16_8x16x1_2x2_4x8_ using WarpShape = cutlass::gemm::GemmShape<8, 16, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1129,9 +1129,9 @@ static void 
BM_SM50_device_minimum_maximum_dsrgemm_tn_t_16x128x16_8x32x1_2x4_4x8 using WarpShape = cutlass::gemm::GemmShape<8, 32, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1179,9 +1179,9 @@ static void BM_SM50_device_minimum_maximum_dsrgemm_tn_t_32x32x8_16x8x1_2x2_8x4_2 using WarpShape = cutlass::gemm::GemmShape<16, 8, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1229,9 +1229,9 @@ static void BM_SM50_device_minimum_maximum_dsrgemm_tn_t_32x64x8_16x16x1_4x2_4x8_ using WarpShape = cutlass::gemm::GemmShape<16, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1279,9 +1279,9 @@ static void 
BM_SM50_device_minimum_maximum_dsrgemm_tn_t_32x128x8_16x32x1_4x4_4x8 using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1329,9 +1329,9 @@ static void BM_SM50_device_minimum_maximum_dsrgemm_tn_t_64x64x8_32x16x1_4x4_8x4_ using WarpShape = cutlass::gemm::GemmShape<32, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1379,9 +1379,9 @@ static void BM_SM50_device_minimum_maximum_dsrgemm_tn_t_32x32x8_8x16x1_2x2_4x8_4 using WarpShape = cutlass::gemm::GemmShape<8, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1429,9 +1429,9 @@ static void 
BM_SM50_device_minimum_maximum_dsrgemm_tn_t_64x32x8_16x16x1_4x2_4x8_ using WarpShape = cutlass::gemm::GemmShape<16, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1479,9 +1479,9 @@ static void BM_SM50_device_minimum_maximum_dsrgemm_tn_t_64x64x8_16x32x1_4x4_4x8_ using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1529,9 +1529,9 @@ static void BM_SM50_device_minimum_maximum_dsrgemm_tn_t_128x32x8_32x16x1_4x4_8x4 using WarpShape = cutlass::gemm::GemmShape<32, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1579,9 +1579,9 @@ static void 
BM_SM50_device_minimum_maximum_dsrgemm_tn_t_32x64x16_8x16x1_2x2_4x8_ using WarpShape = cutlass::gemm::GemmShape<8, 16, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1629,9 +1629,9 @@ static void BM_SM50_device_minimum_maximum_dsrgemm_tn_t_32x128x16_8x32x1_2x4_4x8 using WarpShape = cutlass::gemm::GemmShape<8, 32, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1679,9 +1679,9 @@ static void BM_SM50_device_minimum_maximum_dsrgemm_tn_t_64x32x16_16x8x1_2x2_8x4_ using WarpShape = cutlass::gemm::GemmShape<16, 8, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1729,9 +1729,9 @@ static void 
BM_SM50_device_minimum_maximum_dsrgemm_tn_t_64x64x8_16x16x1_4x2_4x8_ using WarpShape = cutlass::gemm::GemmShape<16, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1779,9 +1779,9 @@ static void BM_SM50_device_minimum_maximum_dsrgemm_tn_t_128x32x16_32x8x1_4x2_8x4 using WarpShape = cutlass::gemm::GemmShape<32, 8, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; diff --git a/bench/device/sm50_simt_minimum_maximum_dsrgemm_tt_n.cu b/bench/device/sm50_simt_minimum_maximum_dsrgemm_tt_n.cu index 6c5950c..d76105f 100644 --- a/bench/device/sm50_simt_minimum_maximum_dsrgemm_tt_n.cu +++ b/bench/device/sm50_simt_minimum_maximum_dsrgemm_tt_n.cu @@ -29,9 +29,9 @@ static void BM_SM50_device_minimum_maximum_dsrgemm_tt_n_8x32x8_8x32x1_2x4_4x8_1x using WarpShape = cutlass::gemm::GemmShape<8, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename 
cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -79,9 +79,9 @@ static void BM_SM50_device_minimum_maximum_dsrgemm_tt_n_16x32x8_16x32x1_4x4_4x8_ using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -129,9 +129,9 @@ static void BM_SM50_device_minimum_maximum_dsrgemm_tt_n_16x64x8_16x64x1_4x8_4x8_ using WarpShape = cutlass::gemm::GemmShape<16, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -179,9 +179,9 @@ static void BM_SM50_device_minimum_maximum_dsrgemm_tt_n_32x32x8_32x32x1_8x4_4x8_ using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + 
precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -229,9 +229,9 @@ static void BM_SM50_device_minimum_maximum_dsrgemm_tt_n_8x32x8_8x16x1_2x2_4x8_1x using WarpShape = cutlass::gemm::GemmShape<8, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -279,9 +279,9 @@ static void BM_SM50_device_minimum_maximum_dsrgemm_tt_n_8x64x8_8x32x1_2x4_4x8_1x using WarpShape = cutlass::gemm::GemmShape<8, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -329,9 +329,9 @@ static void BM_SM50_device_minimum_maximum_dsrgemm_tt_n_16x32x8_16x16x1_4x2_4x8_ using WarpShape = cutlass::gemm::GemmShape<16, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + 
cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -379,9 +379,9 @@ static void BM_SM50_device_minimum_maximum_dsrgemm_tt_n_16x64x8_16x32x1_4x4_4x8_ using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -429,9 +429,9 @@ static void BM_SM50_device_minimum_maximum_dsrgemm_tt_n_16x128x8_16x64x1_4x8_4x8 using WarpShape = cutlass::gemm::GemmShape<16, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -479,9 +479,9 @@ static void BM_SM50_device_minimum_maximum_dsrgemm_tt_n_32x32x8_32x16x1_4x4_8x4_ using WarpShape = cutlass::gemm::GemmShape<32, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using 
AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -529,9 +529,9 @@ static void BM_SM50_device_minimum_maximum_dsrgemm_tt_n_32x64x8_32x32x1_8x4_4x8_ using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -579,9 +579,9 @@ static void BM_SM50_device_minimum_maximum_dsrgemm_tt_n_32x32x8_16x32x1_4x4_4x8_ using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -629,9 +629,9 @@ static void BM_SM50_device_minimum_maximum_dsrgemm_tt_n_64x32x8_32x32x1_8x4_4x8_ using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = 
Config::MultiplicationOp; @@ -679,9 +679,9 @@ static void BM_SM50_device_minimum_maximum_dsrgemm_tt_n_16x32x8_8x16x1_2x2_4x8_2 using WarpShape = cutlass::gemm::GemmShape<8, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -729,9 +729,9 @@ static void BM_SM50_device_minimum_maximum_dsrgemm_tt_n_16x64x8_8x32x1_2x4_4x8_2 using WarpShape = cutlass::gemm::GemmShape<8, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -779,9 +779,9 @@ static void BM_SM50_device_minimum_maximum_dsrgemm_tt_n_32x32x8_16x16x1_4x2_4x8_ using WarpShape = cutlass::gemm::GemmShape<16, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -829,9 +829,9 @@ static void 
BM_SM50_device_minimum_maximum_dsrgemm_tt_n_32x64x8_16x32x1_4x4_4x8_ using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -879,9 +879,9 @@ static void BM_SM50_device_minimum_maximum_dsrgemm_tt_n_32x128x8_16x64x1_4x8_4x8 using WarpShape = cutlass::gemm::GemmShape<16, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -929,9 +929,9 @@ static void BM_SM50_device_minimum_maximum_dsrgemm_tt_n_64x32x8_32x16x1_4x4_8x4_ using WarpShape = cutlass::gemm::GemmShape<32, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -979,9 +979,9 @@ static void 
BM_SM50_device_minimum_maximum_dsrgemm_tt_n_64x64x8_32x32x1_8x4_4x8_ using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1029,9 +1029,9 @@ static void BM_SM50_device_minimum_maximum_dsrgemm_tt_n_128x32x8_64x16x1_8x4_8x4 using WarpShape = cutlass::gemm::GemmShape<64, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1079,9 +1079,9 @@ static void BM_SM50_device_minimum_maximum_dsrgemm_tt_n_16x64x16_8x16x1_2x2_4x8_ using WarpShape = cutlass::gemm::GemmShape<8, 16, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1129,9 +1129,9 @@ static void 
BM_SM50_device_minimum_maximum_dsrgemm_tt_n_16x128x16_8x32x1_2x4_4x8 using WarpShape = cutlass::gemm::GemmShape<8, 32, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1179,9 +1179,9 @@ static void BM_SM50_device_minimum_maximum_dsrgemm_tt_n_32x32x8_16x8x1_2x2_8x4_2 using WarpShape = cutlass::gemm::GemmShape<16, 8, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1229,9 +1229,9 @@ static void BM_SM50_device_minimum_maximum_dsrgemm_tt_n_32x64x8_16x16x1_4x2_4x8_ using WarpShape = cutlass::gemm::GemmShape<16, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1279,9 +1279,9 @@ static void 
BM_SM50_device_minimum_maximum_dsrgemm_tt_n_32x128x8_16x32x1_4x4_4x8 using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1329,9 +1329,9 @@ static void BM_SM50_device_minimum_maximum_dsrgemm_tt_n_64x64x8_32x16x1_4x4_8x4_ using WarpShape = cutlass::gemm::GemmShape<32, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1379,9 +1379,9 @@ static void BM_SM50_device_minimum_maximum_dsrgemm_tt_n_32x32x8_8x16x1_2x2_4x8_4 using WarpShape = cutlass::gemm::GemmShape<8, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1429,9 +1429,9 @@ static void 
BM_SM50_device_minimum_maximum_dsrgemm_tt_n_64x32x8_16x16x1_4x2_4x8_ using WarpShape = cutlass::gemm::GemmShape<16, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1479,9 +1479,9 @@ static void BM_SM50_device_minimum_maximum_dsrgemm_tt_n_64x64x8_16x32x1_4x4_4x8_ using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1529,9 +1529,9 @@ static void BM_SM50_device_minimum_maximum_dsrgemm_tt_n_128x32x8_32x16x1_4x4_8x4 using WarpShape = cutlass::gemm::GemmShape<32, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1579,9 +1579,9 @@ static void 
BM_SM50_device_minimum_maximum_dsrgemm_tt_n_32x64x16_8x16x1_2x2_4x8_ using WarpShape = cutlass::gemm::GemmShape<8, 16, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1629,9 +1629,9 @@ static void BM_SM50_device_minimum_maximum_dsrgemm_tt_n_32x128x16_8x32x1_2x4_4x8 using WarpShape = cutlass::gemm::GemmShape<8, 32, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1679,9 +1679,9 @@ static void BM_SM50_device_minimum_maximum_dsrgemm_tt_n_64x32x16_16x8x1_2x2_8x4_ using WarpShape = cutlass::gemm::GemmShape<16, 8, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1729,9 +1729,9 @@ static void 
BM_SM50_device_minimum_maximum_dsrgemm_tt_n_64x64x8_16x16x1_4x2_4x8_ using WarpShape = cutlass::gemm::GemmShape<16, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1779,9 +1779,9 @@ static void BM_SM50_device_minimum_maximum_dsrgemm_tt_n_128x32x16_32x8x1_4x2_8x4 using WarpShape = cutlass::gemm::GemmShape<32, 8, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; diff --git a/bench/device/sm50_simt_minimum_maximum_dsrgemm_tt_t.cu b/bench/device/sm50_simt_minimum_maximum_dsrgemm_tt_t.cu index ddeb7ee..623cf5b 100644 --- a/bench/device/sm50_simt_minimum_maximum_dsrgemm_tt_t.cu +++ b/bench/device/sm50_simt_minimum_maximum_dsrgemm_tt_t.cu @@ -29,9 +29,9 @@ static void BM_SM50_device_minimum_maximum_dsrgemm_tt_t_8x32x8_8x32x1_2x4_4x8_1x using WarpShape = cutlass::gemm::GemmShape<8, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename 
cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -79,9 +79,9 @@ static void BM_SM50_device_minimum_maximum_dsrgemm_tt_t_16x32x8_16x32x1_4x4_4x8_ using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -129,9 +129,9 @@ static void BM_SM50_device_minimum_maximum_dsrgemm_tt_t_16x64x8_16x64x1_4x8_4x8_ using WarpShape = cutlass::gemm::GemmShape<16, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -179,9 +179,9 @@ static void BM_SM50_device_minimum_maximum_dsrgemm_tt_t_32x32x8_32x32x1_8x4_4x8_ using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + 
precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -229,9 +229,9 @@ static void BM_SM50_device_minimum_maximum_dsrgemm_tt_t_8x32x8_8x16x1_2x2_4x8_1x using WarpShape = cutlass::gemm::GemmShape<8, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -279,9 +279,9 @@ static void BM_SM50_device_minimum_maximum_dsrgemm_tt_t_8x64x8_8x32x1_2x4_4x8_1x using WarpShape = cutlass::gemm::GemmShape<8, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -329,9 +329,9 @@ static void BM_SM50_device_minimum_maximum_dsrgemm_tt_t_16x32x8_16x16x1_4x2_4x8_ using WarpShape = cutlass::gemm::GemmShape<16, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + 
cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -379,9 +379,9 @@ static void BM_SM50_device_minimum_maximum_dsrgemm_tt_t_16x64x8_16x32x1_4x4_4x8_ using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -429,9 +429,9 @@ static void BM_SM50_device_minimum_maximum_dsrgemm_tt_t_16x128x8_16x64x1_4x8_4x8 using WarpShape = cutlass::gemm::GemmShape<16, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -479,9 +479,9 @@ static void BM_SM50_device_minimum_maximum_dsrgemm_tt_t_32x32x8_32x16x1_4x4_8x4_ using WarpShape = cutlass::gemm::GemmShape<32, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using 
AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -529,9 +529,9 @@ static void BM_SM50_device_minimum_maximum_dsrgemm_tt_t_32x64x8_32x32x1_8x4_4x8_ using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -579,9 +579,9 @@ static void BM_SM50_device_minimum_maximum_dsrgemm_tt_t_32x32x8_16x32x1_4x4_4x8_ using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -629,9 +629,9 @@ static void BM_SM50_device_minimum_maximum_dsrgemm_tt_t_64x32x8_32x32x1_8x4_4x8_ using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = 
Config::MultiplicationOp; @@ -679,9 +679,9 @@ static void BM_SM50_device_minimum_maximum_dsrgemm_tt_t_16x32x8_8x16x1_2x2_4x8_2 using WarpShape = cutlass::gemm::GemmShape<8, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -729,9 +729,9 @@ static void BM_SM50_device_minimum_maximum_dsrgemm_tt_t_16x64x8_8x32x1_2x4_4x8_2 using WarpShape = cutlass::gemm::GemmShape<8, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -779,9 +779,9 @@ static void BM_SM50_device_minimum_maximum_dsrgemm_tt_t_32x32x8_16x16x1_4x2_4x8_ using WarpShape = cutlass::gemm::GemmShape<16, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -829,9 +829,9 @@ static void 
BM_SM50_device_minimum_maximum_dsrgemm_tt_t_32x64x8_16x32x1_4x4_4x8_ using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -879,9 +879,9 @@ static void BM_SM50_device_minimum_maximum_dsrgemm_tt_t_32x128x8_16x64x1_4x8_4x8 using WarpShape = cutlass::gemm::GemmShape<16, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -929,9 +929,9 @@ static void BM_SM50_device_minimum_maximum_dsrgemm_tt_t_64x32x8_32x16x1_4x4_8x4_ using WarpShape = cutlass::gemm::GemmShape<32, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -979,9 +979,9 @@ static void 
BM_SM50_device_minimum_maximum_dsrgemm_tt_t_64x64x8_32x32x1_8x4_4x8_ using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1029,9 +1029,9 @@ static void BM_SM50_device_minimum_maximum_dsrgemm_tt_t_128x32x8_64x16x1_8x4_8x4 using WarpShape = cutlass::gemm::GemmShape<64, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1079,9 +1079,9 @@ static void BM_SM50_device_minimum_maximum_dsrgemm_tt_t_16x64x16_8x16x1_2x2_4x8_ using WarpShape = cutlass::gemm::GemmShape<8, 16, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1129,9 +1129,9 @@ static void 
BM_SM50_device_minimum_maximum_dsrgemm_tt_t_16x128x16_8x32x1_2x4_4x8 using WarpShape = cutlass::gemm::GemmShape<8, 32, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1179,9 +1179,9 @@ static void BM_SM50_device_minimum_maximum_dsrgemm_tt_t_32x32x8_16x8x1_2x2_8x4_2 using WarpShape = cutlass::gemm::GemmShape<16, 8, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1229,9 +1229,9 @@ static void BM_SM50_device_minimum_maximum_dsrgemm_tt_t_32x64x8_16x16x1_4x2_4x8_ using WarpShape = cutlass::gemm::GemmShape<16, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1279,9 +1279,9 @@ static void 
BM_SM50_device_minimum_maximum_dsrgemm_tt_t_32x128x8_16x32x1_4x4_4x8 using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1329,9 +1329,9 @@ static void BM_SM50_device_minimum_maximum_dsrgemm_tt_t_64x64x8_32x16x1_4x4_8x4_ using WarpShape = cutlass::gemm::GemmShape<32, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1379,9 +1379,9 @@ static void BM_SM50_device_minimum_maximum_dsrgemm_tt_t_32x32x8_8x16x1_2x2_4x8_4 using WarpShape = cutlass::gemm::GemmShape<8, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1429,9 +1429,9 @@ static void 
BM_SM50_device_minimum_maximum_dsrgemm_tt_t_64x32x8_16x16x1_4x2_4x8_ using WarpShape = cutlass::gemm::GemmShape<16, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1479,9 +1479,9 @@ static void BM_SM50_device_minimum_maximum_dsrgemm_tt_t_64x64x8_16x32x1_4x4_4x8_ using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1529,9 +1529,9 @@ static void BM_SM50_device_minimum_maximum_dsrgemm_tt_t_128x32x8_32x16x1_4x4_8x4 using WarpShape = cutlass::gemm::GemmShape<32, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1579,9 +1579,9 @@ static void 
BM_SM50_device_minimum_maximum_dsrgemm_tt_t_32x64x16_8x16x1_2x2_4x8_ using WarpShape = cutlass::gemm::GemmShape<8, 16, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1629,9 +1629,9 @@ static void BM_SM50_device_minimum_maximum_dsrgemm_tt_t_32x128x16_8x32x1_2x4_4x8 using WarpShape = cutlass::gemm::GemmShape<8, 32, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1679,9 +1679,9 @@ static void BM_SM50_device_minimum_maximum_dsrgemm_tt_t_64x32x16_16x8x1_2x2_8x4_ using WarpShape = cutlass::gemm::GemmShape<16, 8, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1729,9 +1729,9 @@ static void 
BM_SM50_device_minimum_maximum_dsrgemm_tt_t_64x64x8_16x16x1_4x2_4x8_ using WarpShape = cutlass::gemm::GemmShape<16, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1779,9 +1779,9 @@ static void BM_SM50_device_minimum_maximum_dsrgemm_tt_t_128x32x16_32x8x1_4x2_8x4 using WarpShape = cutlass::gemm::GemmShape<32, 8, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; diff --git a/bench/device/sm50_simt_minimum_maximum_ssrgemm_nn_n.cu b/bench/device/sm50_simt_minimum_maximum_ssrgemm_nn_n.cu index 45c7417..a5efce9 100644 --- a/bench/device/sm50_simt_minimum_maximum_ssrgemm_nn_n.cu +++ b/bench/device/sm50_simt_minimum_maximum_ssrgemm_nn_n.cu @@ -29,9 +29,9 @@ static void BM_SM50_device_minimum_maximum_ssrgemm_nn_n_8x32x8_8x32x1_2x4_4x8_1x using WarpShape = cutlass::gemm::GemmShape<8, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename 
cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -79,9 +79,9 @@ static void BM_SM50_device_minimum_maximum_ssrgemm_nn_n_16x32x8_16x32x1_4x4_4x8_ using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -129,9 +129,9 @@ static void BM_SM50_device_minimum_maximum_ssrgemm_nn_n_16x64x8_16x64x1_4x8_4x8_ using WarpShape = cutlass::gemm::GemmShape<16, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -179,9 +179,9 @@ static void BM_SM50_device_minimum_maximum_ssrgemm_nn_n_32x32x8_32x32x1_8x4_4x8_ using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + 
precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -229,9 +229,9 @@ static void BM_SM50_device_minimum_maximum_ssrgemm_nn_n_32x64x8_32x64x1_8x8_4x8_ using WarpShape = cutlass::gemm::GemmShape<32, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -279,9 +279,9 @@ static void BM_SM50_device_minimum_maximum_ssrgemm_nn_n_64x32x8_64x32x1_8x8_8x4_ using WarpShape = cutlass::gemm::GemmShape<64, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -329,9 +329,9 @@ static void BM_SM50_device_minimum_maximum_ssrgemm_nn_n_8x32x8_8x16x1_2x2_4x8_1x using WarpShape = cutlass::gemm::GemmShape<8, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + 
cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -379,9 +379,9 @@ static void BM_SM50_device_minimum_maximum_ssrgemm_nn_n_8x64x8_8x32x1_2x4_4x8_1x using WarpShape = cutlass::gemm::GemmShape<8, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -429,9 +429,9 @@ static void BM_SM50_device_minimum_maximum_ssrgemm_nn_n_16x32x8_16x16x1_4x2_4x8_ using WarpShape = cutlass::gemm::GemmShape<16, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -479,9 +479,9 @@ static void BM_SM50_device_minimum_maximum_ssrgemm_nn_n_16x64x8_16x32x1_4x4_4x8_ using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using 
AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -529,9 +529,9 @@ static void BM_SM50_device_minimum_maximum_ssrgemm_nn_n_16x128x8_16x64x1_4x8_4x8 using WarpShape = cutlass::gemm::GemmShape<16, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -579,9 +579,9 @@ static void BM_SM50_device_minimum_maximum_ssrgemm_nn_n_32x32x8_32x16x1_4x4_8x4_ using WarpShape = cutlass::gemm::GemmShape<32, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -629,9 +629,9 @@ static void BM_SM50_device_minimum_maximum_ssrgemm_nn_n_32x64x8_32x32x1_8x4_4x8_ using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = 
Config::MultiplicationOp; @@ -679,9 +679,9 @@ static void BM_SM50_device_minimum_maximum_ssrgemm_nn_n_32x128x8_32x64x1_8x8_4x8 using WarpShape = cutlass::gemm::GemmShape<32, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -729,9 +729,9 @@ static void BM_SM50_device_minimum_maximum_ssrgemm_nn_n_64x64x8_64x32x1_8x8_8x4_ using WarpShape = cutlass::gemm::GemmShape<64, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -779,9 +779,9 @@ static void BM_SM50_device_minimum_maximum_ssrgemm_nn_n_32x32x8_16x32x1_4x4_4x8_ using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -829,9 +829,9 @@ static void 
BM_SM50_device_minimum_maximum_ssrgemm_nn_n_64x32x8_32x32x1_8x4_4x8_ using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -879,9 +879,9 @@ static void BM_SM50_device_minimum_maximum_ssrgemm_nn_n_64x64x8_32x64x1_8x8_4x8_ using WarpShape = cutlass::gemm::GemmShape<32, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -929,9 +929,9 @@ static void BM_SM50_device_minimum_maximum_ssrgemm_nn_n_128x32x8_64x32x1_8x8_8x4 using WarpShape = cutlass::gemm::GemmShape<64, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -979,9 +979,9 @@ static void 
BM_SM50_device_minimum_maximum_ssrgemm_nn_n_16x32x8_8x16x1_2x2_4x8_2 using WarpShape = cutlass::gemm::GemmShape<8, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1029,9 +1029,9 @@ static void BM_SM50_device_minimum_maximum_ssrgemm_nn_n_16x64x8_8x32x1_2x4_4x8_2 using WarpShape = cutlass::gemm::GemmShape<8, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1079,9 +1079,9 @@ static void BM_SM50_device_minimum_maximum_ssrgemm_nn_n_32x32x8_16x16x1_4x2_4x8_ using WarpShape = cutlass::gemm::GemmShape<16, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1129,9 +1129,9 @@ static void 
BM_SM50_device_minimum_maximum_ssrgemm_nn_n_32x64x8_16x32x1_4x4_4x8_ using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1179,9 +1179,9 @@ static void BM_SM50_device_minimum_maximum_ssrgemm_nn_n_32x128x8_16x64x1_4x8_4x8 using WarpShape = cutlass::gemm::GemmShape<16, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1229,9 +1229,9 @@ static void BM_SM50_device_minimum_maximum_ssrgemm_nn_n_64x32x8_32x16x1_4x4_8x4_ using WarpShape = cutlass::gemm::GemmShape<32, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1279,9 +1279,9 @@ static void 
BM_SM50_device_minimum_maximum_ssrgemm_nn_n_64x64x8_32x32x1_8x4_4x8_ using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1329,9 +1329,9 @@ static void BM_SM50_device_minimum_maximum_ssrgemm_nn_n_64x128x8_32x64x1_8x8_4x8 using WarpShape = cutlass::gemm::GemmShape<32, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1379,9 +1379,9 @@ static void BM_SM50_device_minimum_maximum_ssrgemm_nn_n_128x32x8_64x16x1_8x4_8x4 using WarpShape = cutlass::gemm::GemmShape<64, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1429,9 +1429,9 @@ static void 
BM_SM50_device_minimum_maximum_ssrgemm_nn_n_128x64x8_64x32x1_8x8_8x4 using WarpShape = cutlass::gemm::GemmShape<64, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1479,9 +1479,9 @@ static void BM_SM50_device_minimum_maximum_ssrgemm_nn_n_16x64x16_8x16x1_2x2_4x8_ using WarpShape = cutlass::gemm::GemmShape<8, 16, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1529,9 +1529,9 @@ static void BM_SM50_device_minimum_maximum_ssrgemm_nn_n_16x128x16_8x32x1_2x4_4x8 using WarpShape = cutlass::gemm::GemmShape<8, 32, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1579,9 +1579,9 @@ static void 
BM_SM50_device_minimum_maximum_ssrgemm_nn_n_32x32x8_16x8x1_2x2_8x4_2 using WarpShape = cutlass::gemm::GemmShape<16, 8, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1629,9 +1629,9 @@ static void BM_SM50_device_minimum_maximum_ssrgemm_nn_n_32x64x8_16x16x1_4x2_4x8_ using WarpShape = cutlass::gemm::GemmShape<16, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1679,9 +1679,9 @@ static void BM_SM50_device_minimum_maximum_ssrgemm_nn_n_32x128x8_16x32x1_4x4_4x8 using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1729,9 +1729,9 @@ static void 
BM_SM50_device_minimum_maximum_ssrgemm_nn_n_32x256x8_16x64x1_4x8_4x8 using WarpShape = cutlass::gemm::GemmShape<16, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1779,9 +1779,9 @@ static void BM_SM50_device_minimum_maximum_ssrgemm_nn_n_64x64x8_32x16x1_4x4_8x4_ using WarpShape = cutlass::gemm::GemmShape<32, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1829,9 +1829,9 @@ static void BM_SM50_device_minimum_maximum_ssrgemm_nn_n_64x128x8_32x32x1_8x4_4x8 using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1879,9 +1879,9 @@ static void 
BM_SM50_device_minimum_maximum_ssrgemm_nn_n_64x256x8_32x64x1_8x8_4x8 using WarpShape = cutlass::gemm::GemmShape<32, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1929,9 +1929,9 @@ static void BM_SM50_device_minimum_maximum_ssrgemm_nn_n_128x128x8_64x32x1_8x8_8x using WarpShape = cutlass::gemm::GemmShape<64, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1979,9 +1979,9 @@ static void BM_SM50_device_minimum_maximum_ssrgemm_nn_n_32x32x8_8x16x1_2x2_4x8_4 using WarpShape = cutlass::gemm::GemmShape<8, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -2029,9 +2029,9 @@ static void 
BM_SM50_device_minimum_maximum_ssrgemm_nn_n_64x32x8_16x16x1_4x2_4x8_ using WarpShape = cutlass::gemm::GemmShape<16, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -2079,9 +2079,9 @@ static void BM_SM50_device_minimum_maximum_ssrgemm_nn_n_64x64x8_16x32x1_4x4_4x8_ using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -2129,9 +2129,9 @@ static void BM_SM50_device_minimum_maximum_ssrgemm_nn_n_128x32x8_32x16x1_4x4_8x4 using WarpShape = cutlass::gemm::GemmShape<32, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -2179,9 +2179,9 @@ static void 
BM_SM50_device_minimum_maximum_ssrgemm_nn_n_128x64x8_32x32x1_8x4_4x8 using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -2229,9 +2229,9 @@ static void BM_SM50_device_minimum_maximum_ssrgemm_nn_n_128x128x8_32x64x1_8x8_4x using WarpShape = cutlass::gemm::GemmShape<32, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -2279,9 +2279,9 @@ static void BM_SM50_device_minimum_maximum_ssrgemm_nn_n_256x32x8_64x16x1_8x4_8x4 using WarpShape = cutlass::gemm::GemmShape<64, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -2329,9 +2329,9 @@ static void 
BM_SM50_device_minimum_maximum_ssrgemm_nn_n_256x64x8_64x32x1_8x8_8x4 using WarpShape = cutlass::gemm::GemmShape<64, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -2379,9 +2379,9 @@ static void BM_SM50_device_minimum_maximum_ssrgemm_nn_n_32x64x16_8x16x1_2x2_4x8_ using WarpShape = cutlass::gemm::GemmShape<8, 16, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -2429,9 +2429,9 @@ static void BM_SM50_device_minimum_maximum_ssrgemm_nn_n_32x128x16_8x32x1_2x4_4x8 using WarpShape = cutlass::gemm::GemmShape<8, 32, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -2479,9 +2479,9 @@ static void 
BM_SM50_device_minimum_maximum_ssrgemm_nn_n_64x32x16_16x8x1_2x2_8x4_ using WarpShape = cutlass::gemm::GemmShape<16, 8, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -2529,9 +2529,9 @@ static void BM_SM50_device_minimum_maximum_ssrgemm_nn_n_64x64x8_16x16x1_4x2_4x8_ using WarpShape = cutlass::gemm::GemmShape<16, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -2579,9 +2579,9 @@ static void BM_SM50_device_minimum_maximum_ssrgemm_nn_n_64x128x8_16x32x1_4x4_4x8 using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -2629,9 +2629,9 @@ static void 
BM_SM50_device_minimum_maximum_ssrgemm_nn_n_64x256x8_16x64x1_4x8_4x8 using WarpShape = cutlass::gemm::GemmShape<16, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -2679,9 +2679,9 @@ static void BM_SM50_device_minimum_maximum_ssrgemm_nn_n_128x32x16_32x8x1_4x2_8x4 using WarpShape = cutlass::gemm::GemmShape<32, 8, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -2729,9 +2729,9 @@ static void BM_SM50_device_minimum_maximum_ssrgemm_nn_n_128x64x8_32x16x1_4x4_8x4 using WarpShape = cutlass::gemm::GemmShape<32, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -2779,9 +2779,9 @@ static void 
BM_SM50_device_minimum_maximum_ssrgemm_nn_n_128x128x8_32x32x1_8x4_4x using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -2829,9 +2829,9 @@ static void BM_SM50_device_minimum_maximum_ssrgemm_nn_n_256x64x8_64x16x1_8x4_8x4 using WarpShape = cutlass::gemm::GemmShape<64, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; diff --git a/bench/device/sm50_simt_minimum_maximum_ssrgemm_nn_t.cu b/bench/device/sm50_simt_minimum_maximum_ssrgemm_nn_t.cu index f71960f..7607483 100644 --- a/bench/device/sm50_simt_minimum_maximum_ssrgemm_nn_t.cu +++ b/bench/device/sm50_simt_minimum_maximum_ssrgemm_nn_t.cu @@ -29,9 +29,9 @@ static void BM_SM50_device_minimum_maximum_ssrgemm_nn_t_8x32x8_8x32x1_2x4_4x8_1x using WarpShape = cutlass::gemm::GemmShape<8, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename 
cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -79,9 +79,9 @@ static void BM_SM50_device_minimum_maximum_ssrgemm_nn_t_16x32x8_16x32x1_4x4_4x8_ using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -129,9 +129,9 @@ static void BM_SM50_device_minimum_maximum_ssrgemm_nn_t_16x64x8_16x64x1_4x8_4x8_ using WarpShape = cutlass::gemm::GemmShape<16, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -179,9 +179,9 @@ static void BM_SM50_device_minimum_maximum_ssrgemm_nn_t_32x32x8_32x32x1_8x4_4x8_ using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + 
precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -229,9 +229,9 @@ static void BM_SM50_device_minimum_maximum_ssrgemm_nn_t_32x64x8_32x64x1_8x8_4x8_ using WarpShape = cutlass::gemm::GemmShape<32, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -279,9 +279,9 @@ static void BM_SM50_device_minimum_maximum_ssrgemm_nn_t_64x32x8_64x32x1_8x8_8x4_ using WarpShape = cutlass::gemm::GemmShape<64, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -329,9 +329,9 @@ static void BM_SM50_device_minimum_maximum_ssrgemm_nn_t_8x32x8_8x16x1_2x2_4x8_1x using WarpShape = cutlass::gemm::GemmShape<8, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + 
cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -379,9 +379,9 @@ static void BM_SM50_device_minimum_maximum_ssrgemm_nn_t_8x64x8_8x32x1_2x4_4x8_1x using WarpShape = cutlass::gemm::GemmShape<8, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -429,9 +429,9 @@ static void BM_SM50_device_minimum_maximum_ssrgemm_nn_t_16x32x8_16x16x1_4x2_4x8_ using WarpShape = cutlass::gemm::GemmShape<16, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -479,9 +479,9 @@ static void BM_SM50_device_minimum_maximum_ssrgemm_nn_t_16x64x8_16x32x1_4x4_4x8_ using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using 
AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -529,9 +529,9 @@ static void BM_SM50_device_minimum_maximum_ssrgemm_nn_t_16x128x8_16x64x1_4x8_4x8 using WarpShape = cutlass::gemm::GemmShape<16, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -579,9 +579,9 @@ static void BM_SM50_device_minimum_maximum_ssrgemm_nn_t_32x32x8_32x16x1_4x4_8x4_ using WarpShape = cutlass::gemm::GemmShape<32, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -629,9 +629,9 @@ static void BM_SM50_device_minimum_maximum_ssrgemm_nn_t_32x64x8_32x32x1_8x4_4x8_ using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = 
Config::MultiplicationOp; @@ -679,9 +679,9 @@ static void BM_SM50_device_minimum_maximum_ssrgemm_nn_t_32x128x8_32x64x1_8x8_4x8 using WarpShape = cutlass::gemm::GemmShape<32, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -729,9 +729,9 @@ static void BM_SM50_device_minimum_maximum_ssrgemm_nn_t_64x64x8_64x32x1_8x8_8x4_ using WarpShape = cutlass::gemm::GemmShape<64, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -779,9 +779,9 @@ static void BM_SM50_device_minimum_maximum_ssrgemm_nn_t_32x32x8_16x32x1_4x4_4x8_ using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -829,9 +829,9 @@ static void 
BM_SM50_device_minimum_maximum_ssrgemm_nn_t_64x32x8_32x32x1_8x4_4x8_ using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -879,9 +879,9 @@ static void BM_SM50_device_minimum_maximum_ssrgemm_nn_t_64x64x8_32x64x1_8x8_4x8_ using WarpShape = cutlass::gemm::GemmShape<32, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -929,9 +929,9 @@ static void BM_SM50_device_minimum_maximum_ssrgemm_nn_t_128x32x8_64x32x1_8x8_8x4 using WarpShape = cutlass::gemm::GemmShape<64, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -979,9 +979,9 @@ static void 
BM_SM50_device_minimum_maximum_ssrgemm_nn_t_16x32x8_8x16x1_2x2_4x8_2 using WarpShape = cutlass::gemm::GemmShape<8, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1029,9 +1029,9 @@ static void BM_SM50_device_minimum_maximum_ssrgemm_nn_t_16x64x8_8x32x1_2x4_4x8_2 using WarpShape = cutlass::gemm::GemmShape<8, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1079,9 +1079,9 @@ static void BM_SM50_device_minimum_maximum_ssrgemm_nn_t_32x32x8_16x16x1_4x2_4x8_ using WarpShape = cutlass::gemm::GemmShape<16, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1129,9 +1129,9 @@ static void 
BM_SM50_device_minimum_maximum_ssrgemm_nn_t_32x64x8_16x32x1_4x4_4x8_ using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1179,9 +1179,9 @@ static void BM_SM50_device_minimum_maximum_ssrgemm_nn_t_32x128x8_16x64x1_4x8_4x8 using WarpShape = cutlass::gemm::GemmShape<16, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1229,9 +1229,9 @@ static void BM_SM50_device_minimum_maximum_ssrgemm_nn_t_64x32x8_32x16x1_4x4_8x4_ using WarpShape = cutlass::gemm::GemmShape<32, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1279,9 +1279,9 @@ static void 
BM_SM50_device_minimum_maximum_ssrgemm_nn_t_64x64x8_32x32x1_8x4_4x8_ using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1329,9 +1329,9 @@ static void BM_SM50_device_minimum_maximum_ssrgemm_nn_t_64x128x8_32x64x1_8x8_4x8 using WarpShape = cutlass::gemm::GemmShape<32, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1379,9 +1379,9 @@ static void BM_SM50_device_minimum_maximum_ssrgemm_nn_t_128x32x8_64x16x1_8x4_8x4 using WarpShape = cutlass::gemm::GemmShape<64, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1429,9 +1429,9 @@ static void 
BM_SM50_device_minimum_maximum_ssrgemm_nn_t_128x64x8_64x32x1_8x8_8x4 using WarpShape = cutlass::gemm::GemmShape<64, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1479,9 +1479,9 @@ static void BM_SM50_device_minimum_maximum_ssrgemm_nn_t_16x64x16_8x16x1_2x2_4x8_ using WarpShape = cutlass::gemm::GemmShape<8, 16, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1529,9 +1529,9 @@ static void BM_SM50_device_minimum_maximum_ssrgemm_nn_t_16x128x16_8x32x1_2x4_4x8 using WarpShape = cutlass::gemm::GemmShape<8, 32, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1579,9 +1579,9 @@ static void 
BM_SM50_device_minimum_maximum_ssrgemm_nn_t_32x32x8_16x8x1_2x2_8x4_2 using WarpShape = cutlass::gemm::GemmShape<16, 8, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1629,9 +1629,9 @@ static void BM_SM50_device_minimum_maximum_ssrgemm_nn_t_32x64x8_16x16x1_4x2_4x8_ using WarpShape = cutlass::gemm::GemmShape<16, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1679,9 +1679,9 @@ static void BM_SM50_device_minimum_maximum_ssrgemm_nn_t_32x128x8_16x32x1_4x4_4x8 using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1729,9 +1729,9 @@ static void 
BM_SM50_device_minimum_maximum_ssrgemm_nn_t_32x256x8_16x64x1_4x8_4x8 using WarpShape = cutlass::gemm::GemmShape<16, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1779,9 +1779,9 @@ static void BM_SM50_device_minimum_maximum_ssrgemm_nn_t_64x64x8_32x16x1_4x4_8x4_ using WarpShape = cutlass::gemm::GemmShape<32, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1829,9 +1829,9 @@ static void BM_SM50_device_minimum_maximum_ssrgemm_nn_t_64x128x8_32x32x1_8x4_4x8 using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1879,9 +1879,9 @@ static void 
BM_SM50_device_minimum_maximum_ssrgemm_nn_t_64x256x8_32x64x1_8x8_4x8 using WarpShape = cutlass::gemm::GemmShape<32, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1929,9 +1929,9 @@ static void BM_SM50_device_minimum_maximum_ssrgemm_nn_t_128x128x8_64x32x1_8x8_8x using WarpShape = cutlass::gemm::GemmShape<64, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1979,9 +1979,9 @@ static void BM_SM50_device_minimum_maximum_ssrgemm_nn_t_32x32x8_8x16x1_2x2_4x8_4 using WarpShape = cutlass::gemm::GemmShape<8, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -2029,9 +2029,9 @@ static void 
BM_SM50_device_minimum_maximum_ssrgemm_nn_t_64x32x8_16x16x1_4x2_4x8_ using WarpShape = cutlass::gemm::GemmShape<16, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -2079,9 +2079,9 @@ static void BM_SM50_device_minimum_maximum_ssrgemm_nn_t_64x64x8_16x32x1_4x4_4x8_ using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -2129,9 +2129,9 @@ static void BM_SM50_device_minimum_maximum_ssrgemm_nn_t_128x32x8_32x16x1_4x4_8x4 using WarpShape = cutlass::gemm::GemmShape<32, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -2179,9 +2179,9 @@ static void 
BM_SM50_device_minimum_maximum_ssrgemm_nn_t_128x64x8_32x32x1_8x4_4x8 using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -2229,9 +2229,9 @@ static void BM_SM50_device_minimum_maximum_ssrgemm_nn_t_128x128x8_32x64x1_8x8_4x using WarpShape = cutlass::gemm::GemmShape<32, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -2279,9 +2279,9 @@ static void BM_SM50_device_minimum_maximum_ssrgemm_nn_t_256x32x8_64x16x1_8x4_8x4 using WarpShape = cutlass::gemm::GemmShape<64, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -2329,9 +2329,9 @@ static void 
BM_SM50_device_minimum_maximum_ssrgemm_nn_t_256x64x8_64x32x1_8x8_8x4 using WarpShape = cutlass::gemm::GemmShape<64, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -2379,9 +2379,9 @@ static void BM_SM50_device_minimum_maximum_ssrgemm_nn_t_32x64x16_8x16x1_2x2_4x8_ using WarpShape = cutlass::gemm::GemmShape<8, 16, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -2429,9 +2429,9 @@ static void BM_SM50_device_minimum_maximum_ssrgemm_nn_t_32x128x16_8x32x1_2x4_4x8 using WarpShape = cutlass::gemm::GemmShape<8, 32, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -2479,9 +2479,9 @@ static void 
BM_SM50_device_minimum_maximum_ssrgemm_nn_t_64x32x16_16x8x1_2x2_8x4_ using WarpShape = cutlass::gemm::GemmShape<16, 8, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -2529,9 +2529,9 @@ static void BM_SM50_device_minimum_maximum_ssrgemm_nn_t_64x64x8_16x16x1_4x2_4x8_ using WarpShape = cutlass::gemm::GemmShape<16, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -2579,9 +2579,9 @@ static void BM_SM50_device_minimum_maximum_ssrgemm_nn_t_64x128x8_16x32x1_4x4_4x8 using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -2629,9 +2629,9 @@ static void 
BM_SM50_device_minimum_maximum_ssrgemm_nn_t_64x256x8_16x64x1_4x8_4x8 using WarpShape = cutlass::gemm::GemmShape<16, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -2679,9 +2679,9 @@ static void BM_SM50_device_minimum_maximum_ssrgemm_nn_t_128x32x16_32x8x1_4x2_8x4 using WarpShape = cutlass::gemm::GemmShape<32, 8, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -2729,9 +2729,9 @@ static void BM_SM50_device_minimum_maximum_ssrgemm_nn_t_128x64x8_32x16x1_4x4_8x4 using WarpShape = cutlass::gemm::GemmShape<32, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -2779,9 +2779,9 @@ static void 
BM_SM50_device_minimum_maximum_ssrgemm_nn_t_128x128x8_32x32x1_8x4_4x using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -2829,9 +2829,9 @@ static void BM_SM50_device_minimum_maximum_ssrgemm_nn_t_256x64x8_64x16x1_8x4_8x4 using WarpShape = cutlass::gemm::GemmShape<64, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; diff --git a/bench/device/sm50_simt_minimum_maximum_ssrgemm_nt_n.cu b/bench/device/sm50_simt_minimum_maximum_ssrgemm_nt_n.cu index f05a891..2cd15b1 100644 --- a/bench/device/sm50_simt_minimum_maximum_ssrgemm_nt_n.cu +++ b/bench/device/sm50_simt_minimum_maximum_ssrgemm_nt_n.cu @@ -29,9 +29,9 @@ static void BM_SM50_device_minimum_maximum_ssrgemm_nt_n_8x32x8_8x32x1_2x4_4x8_1x using WarpShape = cutlass::gemm::GemmShape<8, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename 
cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -79,9 +79,9 @@ static void BM_SM50_device_minimum_maximum_ssrgemm_nt_n_16x32x8_16x32x1_4x4_4x8_ using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -129,9 +129,9 @@ static void BM_SM50_device_minimum_maximum_ssrgemm_nt_n_16x64x8_16x64x1_4x8_4x8_ using WarpShape = cutlass::gemm::GemmShape<16, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -179,9 +179,9 @@ static void BM_SM50_device_minimum_maximum_ssrgemm_nt_n_32x32x8_32x32x1_8x4_4x8_ using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + 
precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -229,9 +229,9 @@ static void BM_SM50_device_minimum_maximum_ssrgemm_nt_n_32x64x8_32x64x1_8x8_4x8_ using WarpShape = cutlass::gemm::GemmShape<32, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -279,9 +279,9 @@ static void BM_SM50_device_minimum_maximum_ssrgemm_nt_n_64x32x8_64x32x1_8x8_8x4_ using WarpShape = cutlass::gemm::GemmShape<64, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -329,9 +329,9 @@ static void BM_SM50_device_minimum_maximum_ssrgemm_nt_n_8x32x8_8x16x1_2x2_4x8_1x using WarpShape = cutlass::gemm::GemmShape<8, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + 
cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -379,9 +379,9 @@ static void BM_SM50_device_minimum_maximum_ssrgemm_nt_n_8x64x8_8x32x1_2x4_4x8_1x using WarpShape = cutlass::gemm::GemmShape<8, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -429,9 +429,9 @@ static void BM_SM50_device_minimum_maximum_ssrgemm_nt_n_16x32x8_16x16x1_4x2_4x8_ using WarpShape = cutlass::gemm::GemmShape<16, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -479,9 +479,9 @@ static void BM_SM50_device_minimum_maximum_ssrgemm_nt_n_16x64x8_16x32x1_4x4_4x8_ using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using 
AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -529,9 +529,9 @@ static void BM_SM50_device_minimum_maximum_ssrgemm_nt_n_16x128x8_16x64x1_4x8_4x8 using WarpShape = cutlass::gemm::GemmShape<16, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -579,9 +579,9 @@ static void BM_SM50_device_minimum_maximum_ssrgemm_nt_n_32x32x8_32x16x1_4x4_8x4_ using WarpShape = cutlass::gemm::GemmShape<32, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -629,9 +629,9 @@ static void BM_SM50_device_minimum_maximum_ssrgemm_nt_n_32x64x8_32x32x1_8x4_4x8_ using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = 
Config::MultiplicationOp; @@ -679,9 +679,9 @@ static void BM_SM50_device_minimum_maximum_ssrgemm_nt_n_32x128x8_32x64x1_8x8_4x8 using WarpShape = cutlass::gemm::GemmShape<32, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -729,9 +729,9 @@ static void BM_SM50_device_minimum_maximum_ssrgemm_nt_n_64x64x8_64x32x1_8x8_8x4_ using WarpShape = cutlass::gemm::GemmShape<64, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -779,9 +779,9 @@ static void BM_SM50_device_minimum_maximum_ssrgemm_nt_n_32x32x8_16x32x1_4x4_4x8_ using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -829,9 +829,9 @@ static void 
BM_SM50_device_minimum_maximum_ssrgemm_nt_n_64x32x8_32x32x1_8x4_4x8_ using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -879,9 +879,9 @@ static void BM_SM50_device_minimum_maximum_ssrgemm_nt_n_64x64x8_32x64x1_8x8_4x8_ using WarpShape = cutlass::gemm::GemmShape<32, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -929,9 +929,9 @@ static void BM_SM50_device_minimum_maximum_ssrgemm_nt_n_128x32x8_64x32x1_8x8_8x4 using WarpShape = cutlass::gemm::GemmShape<64, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -979,9 +979,9 @@ static void 
BM_SM50_device_minimum_maximum_ssrgemm_nt_n_16x32x8_8x16x1_2x2_4x8_2 using WarpShape = cutlass::gemm::GemmShape<8, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1029,9 +1029,9 @@ static void BM_SM50_device_minimum_maximum_ssrgemm_nt_n_16x64x8_8x32x1_2x4_4x8_2 using WarpShape = cutlass::gemm::GemmShape<8, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1079,9 +1079,9 @@ static void BM_SM50_device_minimum_maximum_ssrgemm_nt_n_32x32x8_16x16x1_4x2_4x8_ using WarpShape = cutlass::gemm::GemmShape<16, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1129,9 +1129,9 @@ static void 
BM_SM50_device_minimum_maximum_ssrgemm_nt_n_32x64x8_16x32x1_4x4_4x8_ using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1179,9 +1179,9 @@ static void BM_SM50_device_minimum_maximum_ssrgemm_nt_n_32x128x8_16x64x1_4x8_4x8 using WarpShape = cutlass::gemm::GemmShape<16, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1229,9 +1229,9 @@ static void BM_SM50_device_minimum_maximum_ssrgemm_nt_n_64x32x8_32x16x1_4x4_8x4_ using WarpShape = cutlass::gemm::GemmShape<32, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1279,9 +1279,9 @@ static void 
BM_SM50_device_minimum_maximum_ssrgemm_nt_n_64x64x8_32x32x1_8x4_4x8_ using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1329,9 +1329,9 @@ static void BM_SM50_device_minimum_maximum_ssrgemm_nt_n_64x128x8_32x64x1_8x8_4x8 using WarpShape = cutlass::gemm::GemmShape<32, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1379,9 +1379,9 @@ static void BM_SM50_device_minimum_maximum_ssrgemm_nt_n_128x32x8_64x16x1_8x4_8x4 using WarpShape = cutlass::gemm::GemmShape<64, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1429,9 +1429,9 @@ static void 
BM_SM50_device_minimum_maximum_ssrgemm_nt_n_128x64x8_64x32x1_8x8_8x4 using WarpShape = cutlass::gemm::GemmShape<64, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1479,9 +1479,9 @@ static void BM_SM50_device_minimum_maximum_ssrgemm_nt_n_16x64x16_8x16x1_2x2_4x8_ using WarpShape = cutlass::gemm::GemmShape<8, 16, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1529,9 +1529,9 @@ static void BM_SM50_device_minimum_maximum_ssrgemm_nt_n_16x128x16_8x32x1_2x4_4x8 using WarpShape = cutlass::gemm::GemmShape<8, 32, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1579,9 +1579,9 @@ static void 
BM_SM50_device_minimum_maximum_ssrgemm_nt_n_32x32x8_16x8x1_2x2_8x4_2 using WarpShape = cutlass::gemm::GemmShape<16, 8, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1629,9 +1629,9 @@ static void BM_SM50_device_minimum_maximum_ssrgemm_nt_n_32x64x8_16x16x1_4x2_4x8_ using WarpShape = cutlass::gemm::GemmShape<16, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1679,9 +1679,9 @@ static void BM_SM50_device_minimum_maximum_ssrgemm_nt_n_32x128x8_16x32x1_4x4_4x8 using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1729,9 +1729,9 @@ static void 
BM_SM50_device_minimum_maximum_ssrgemm_nt_n_32x256x8_16x64x1_4x8_4x8 using WarpShape = cutlass::gemm::GemmShape<16, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1779,9 +1779,9 @@ static void BM_SM50_device_minimum_maximum_ssrgemm_nt_n_64x64x8_32x16x1_4x4_8x4_ using WarpShape = cutlass::gemm::GemmShape<32, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1829,9 +1829,9 @@ static void BM_SM50_device_minimum_maximum_ssrgemm_nt_n_64x128x8_32x32x1_8x4_4x8 using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1879,9 +1879,9 @@ static void 
BM_SM50_device_minimum_maximum_ssrgemm_nt_n_64x256x8_32x64x1_8x8_4x8 using WarpShape = cutlass::gemm::GemmShape<32, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1929,9 +1929,9 @@ static void BM_SM50_device_minimum_maximum_ssrgemm_nt_n_128x128x8_64x32x1_8x8_8x using WarpShape = cutlass::gemm::GemmShape<64, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1979,9 +1979,9 @@ static void BM_SM50_device_minimum_maximum_ssrgemm_nt_n_32x32x8_8x16x1_2x2_4x8_4 using WarpShape = cutlass::gemm::GemmShape<8, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -2029,9 +2029,9 @@ static void 
BM_SM50_device_minimum_maximum_ssrgemm_nt_n_64x32x8_16x16x1_4x2_4x8_ using WarpShape = cutlass::gemm::GemmShape<16, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -2079,9 +2079,9 @@ static void BM_SM50_device_minimum_maximum_ssrgemm_nt_n_64x64x8_16x32x1_4x4_4x8_ using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -2129,9 +2129,9 @@ static void BM_SM50_device_minimum_maximum_ssrgemm_nt_n_128x32x8_32x16x1_4x4_8x4 using WarpShape = cutlass::gemm::GemmShape<32, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -2179,9 +2179,9 @@ static void 
BM_SM50_device_minimum_maximum_ssrgemm_nt_n_128x64x8_32x32x1_8x4_4x8 using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -2229,9 +2229,9 @@ static void BM_SM50_device_minimum_maximum_ssrgemm_nt_n_128x128x8_32x64x1_8x8_4x using WarpShape = cutlass::gemm::GemmShape<32, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -2279,9 +2279,9 @@ static void BM_SM50_device_minimum_maximum_ssrgemm_nt_n_256x32x8_64x16x1_8x4_8x4 using WarpShape = cutlass::gemm::GemmShape<64, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -2329,9 +2329,9 @@ static void 
BM_SM50_device_minimum_maximum_ssrgemm_nt_n_256x64x8_64x32x1_8x8_8x4 using WarpShape = cutlass::gemm::GemmShape<64, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -2379,9 +2379,9 @@ static void BM_SM50_device_minimum_maximum_ssrgemm_nt_n_32x64x16_8x16x1_2x2_4x8_ using WarpShape = cutlass::gemm::GemmShape<8, 16, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -2429,9 +2429,9 @@ static void BM_SM50_device_minimum_maximum_ssrgemm_nt_n_32x128x16_8x32x1_2x4_4x8 using WarpShape = cutlass::gemm::GemmShape<8, 32, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -2479,9 +2479,9 @@ static void 
BM_SM50_device_minimum_maximum_ssrgemm_nt_n_64x32x16_16x8x1_2x2_8x4_ using WarpShape = cutlass::gemm::GemmShape<16, 8, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -2529,9 +2529,9 @@ static void BM_SM50_device_minimum_maximum_ssrgemm_nt_n_64x64x8_16x16x1_4x2_4x8_ using WarpShape = cutlass::gemm::GemmShape<16, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -2579,9 +2579,9 @@ static void BM_SM50_device_minimum_maximum_ssrgemm_nt_n_64x128x8_16x32x1_4x4_4x8 using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -2629,9 +2629,9 @@ static void 
BM_SM50_device_minimum_maximum_ssrgemm_nt_n_64x256x8_16x64x1_4x8_4x8 using WarpShape = cutlass::gemm::GemmShape<16, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -2679,9 +2679,9 @@ static void BM_SM50_device_minimum_maximum_ssrgemm_nt_n_128x32x16_32x8x1_4x2_8x4 using WarpShape = cutlass::gemm::GemmShape<32, 8, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -2729,9 +2729,9 @@ static void BM_SM50_device_minimum_maximum_ssrgemm_nt_n_128x64x8_32x16x1_4x4_8x4 using WarpShape = cutlass::gemm::GemmShape<32, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -2779,9 +2779,9 @@ static void 
BM_SM50_device_minimum_maximum_ssrgemm_nt_n_128x128x8_32x32x1_8x4_4x using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -2829,9 +2829,9 @@ static void BM_SM50_device_minimum_maximum_ssrgemm_nt_n_256x64x8_64x16x1_8x4_8x4 using WarpShape = cutlass::gemm::GemmShape<64, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; diff --git a/bench/device/sm50_simt_minimum_maximum_ssrgemm_nt_t.cu b/bench/device/sm50_simt_minimum_maximum_ssrgemm_nt_t.cu index 9e59aea..03c00a7 100644 --- a/bench/device/sm50_simt_minimum_maximum_ssrgemm_nt_t.cu +++ b/bench/device/sm50_simt_minimum_maximum_ssrgemm_nt_t.cu @@ -29,9 +29,9 @@ static void BM_SM50_device_minimum_maximum_ssrgemm_nt_t_8x32x8_8x32x1_2x4_4x8_1x using WarpShape = cutlass::gemm::GemmShape<8, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename 
cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -79,9 +79,9 @@ static void BM_SM50_device_minimum_maximum_ssrgemm_nt_t_16x32x8_16x32x1_4x4_4x8_ using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -129,9 +129,9 @@ static void BM_SM50_device_minimum_maximum_ssrgemm_nt_t_16x64x8_16x64x1_4x8_4x8_ using WarpShape = cutlass::gemm::GemmShape<16, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -179,9 +179,9 @@ static void BM_SM50_device_minimum_maximum_ssrgemm_nt_t_32x32x8_32x32x1_8x4_4x8_ using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + 
precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -229,9 +229,9 @@ static void BM_SM50_device_minimum_maximum_ssrgemm_nt_t_32x64x8_32x64x1_8x8_4x8_ using WarpShape = cutlass::gemm::GemmShape<32, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -279,9 +279,9 @@ static void BM_SM50_device_minimum_maximum_ssrgemm_nt_t_64x32x8_64x32x1_8x8_8x4_ using WarpShape = cutlass::gemm::GemmShape<64, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -329,9 +329,9 @@ static void BM_SM50_device_minimum_maximum_ssrgemm_nt_t_8x32x8_8x16x1_2x2_4x8_1x using WarpShape = cutlass::gemm::GemmShape<8, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + 
cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -379,9 +379,9 @@ static void BM_SM50_device_minimum_maximum_ssrgemm_nt_t_8x64x8_8x32x1_2x4_4x8_1x using WarpShape = cutlass::gemm::GemmShape<8, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -429,9 +429,9 @@ static void BM_SM50_device_minimum_maximum_ssrgemm_nt_t_16x32x8_16x16x1_4x2_4x8_ using WarpShape = cutlass::gemm::GemmShape<16, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -479,9 +479,9 @@ static void BM_SM50_device_minimum_maximum_ssrgemm_nt_t_16x64x8_16x32x1_4x4_4x8_ using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using 
AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -529,9 +529,9 @@ static void BM_SM50_device_minimum_maximum_ssrgemm_nt_t_16x128x8_16x64x1_4x8_4x8 using WarpShape = cutlass::gemm::GemmShape<16, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -579,9 +579,9 @@ static void BM_SM50_device_minimum_maximum_ssrgemm_nt_t_32x32x8_32x16x1_4x4_8x4_ using WarpShape = cutlass::gemm::GemmShape<32, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -629,9 +629,9 @@ static void BM_SM50_device_minimum_maximum_ssrgemm_nt_t_32x64x8_32x32x1_8x4_4x8_ using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = 
Config::MultiplicationOp; @@ -679,9 +679,9 @@ static void BM_SM50_device_minimum_maximum_ssrgemm_nt_t_32x128x8_32x64x1_8x8_4x8 using WarpShape = cutlass::gemm::GemmShape<32, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -729,9 +729,9 @@ static void BM_SM50_device_minimum_maximum_ssrgemm_nt_t_64x64x8_64x32x1_8x8_8x4_ using WarpShape = cutlass::gemm::GemmShape<64, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -779,9 +779,9 @@ static void BM_SM50_device_minimum_maximum_ssrgemm_nt_t_32x32x8_16x32x1_4x4_4x8_ using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -829,9 +829,9 @@ static void 
BM_SM50_device_minimum_maximum_ssrgemm_nt_t_64x32x8_32x32x1_8x4_4x8_ using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -879,9 +879,9 @@ static void BM_SM50_device_minimum_maximum_ssrgemm_nt_t_64x64x8_32x64x1_8x8_4x8_ using WarpShape = cutlass::gemm::GemmShape<32, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -929,9 +929,9 @@ static void BM_SM50_device_minimum_maximum_ssrgemm_nt_t_128x32x8_64x32x1_8x8_8x4 using WarpShape = cutlass::gemm::GemmShape<64, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -979,9 +979,9 @@ static void 
BM_SM50_device_minimum_maximum_ssrgemm_nt_t_16x32x8_8x16x1_2x2_4x8_2 using WarpShape = cutlass::gemm::GemmShape<8, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1029,9 +1029,9 @@ static void BM_SM50_device_minimum_maximum_ssrgemm_nt_t_16x64x8_8x32x1_2x4_4x8_2 using WarpShape = cutlass::gemm::GemmShape<8, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1079,9 +1079,9 @@ static void BM_SM50_device_minimum_maximum_ssrgemm_nt_t_32x32x8_16x16x1_4x2_4x8_ using WarpShape = cutlass::gemm::GemmShape<16, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1129,9 +1129,9 @@ static void 
BM_SM50_device_minimum_maximum_ssrgemm_nt_t_32x64x8_16x32x1_4x4_4x8_ using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1179,9 +1179,9 @@ static void BM_SM50_device_minimum_maximum_ssrgemm_nt_t_32x128x8_16x64x1_4x8_4x8 using WarpShape = cutlass::gemm::GemmShape<16, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1229,9 +1229,9 @@ static void BM_SM50_device_minimum_maximum_ssrgemm_nt_t_64x32x8_32x16x1_4x4_8x4_ using WarpShape = cutlass::gemm::GemmShape<32, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1279,9 +1279,9 @@ static void 
BM_SM50_device_minimum_maximum_ssrgemm_nt_t_64x64x8_32x32x1_8x4_4x8_ using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1329,9 +1329,9 @@ static void BM_SM50_device_minimum_maximum_ssrgemm_nt_t_64x128x8_32x64x1_8x8_4x8 using WarpShape = cutlass::gemm::GemmShape<32, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1379,9 +1379,9 @@ static void BM_SM50_device_minimum_maximum_ssrgemm_nt_t_128x32x8_64x16x1_8x4_8x4 using WarpShape = cutlass::gemm::GemmShape<64, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1429,9 +1429,9 @@ static void 
BM_SM50_device_minimum_maximum_ssrgemm_nt_t_128x64x8_64x32x1_8x8_8x4 using WarpShape = cutlass::gemm::GemmShape<64, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1479,9 +1479,9 @@ static void BM_SM50_device_minimum_maximum_ssrgemm_nt_t_16x64x16_8x16x1_2x2_4x8_ using WarpShape = cutlass::gemm::GemmShape<8, 16, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1529,9 +1529,9 @@ static void BM_SM50_device_minimum_maximum_ssrgemm_nt_t_16x128x16_8x32x1_2x4_4x8 using WarpShape = cutlass::gemm::GemmShape<8, 32, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1579,9 +1579,9 @@ static void 
BM_SM50_device_minimum_maximum_ssrgemm_nt_t_32x32x8_16x8x1_2x2_8x4_2 using WarpShape = cutlass::gemm::GemmShape<16, 8, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1629,9 +1629,9 @@ static void BM_SM50_device_minimum_maximum_ssrgemm_nt_t_32x64x8_16x16x1_4x2_4x8_ using WarpShape = cutlass::gemm::GemmShape<16, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1679,9 +1679,9 @@ static void BM_SM50_device_minimum_maximum_ssrgemm_nt_t_32x128x8_16x32x1_4x4_4x8 using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1729,9 +1729,9 @@ static void 
BM_SM50_device_minimum_maximum_ssrgemm_nt_t_32x256x8_16x64x1_4x8_4x8 using WarpShape = cutlass::gemm::GemmShape<16, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1779,9 +1779,9 @@ static void BM_SM50_device_minimum_maximum_ssrgemm_nt_t_64x64x8_32x16x1_4x4_8x4_ using WarpShape = cutlass::gemm::GemmShape<32, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1829,9 +1829,9 @@ static void BM_SM50_device_minimum_maximum_ssrgemm_nt_t_64x128x8_32x32x1_8x4_4x8 using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1879,9 +1879,9 @@ static void 
BM_SM50_device_minimum_maximum_ssrgemm_nt_t_64x256x8_32x64x1_8x8_4x8 using WarpShape = cutlass::gemm::GemmShape<32, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1929,9 +1929,9 @@ static void BM_SM50_device_minimum_maximum_ssrgemm_nt_t_128x128x8_64x32x1_8x8_8x using WarpShape = cutlass::gemm::GemmShape<64, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1979,9 +1979,9 @@ static void BM_SM50_device_minimum_maximum_ssrgemm_nt_t_32x32x8_8x16x1_2x2_4x8_4 using WarpShape = cutlass::gemm::GemmShape<8, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -2029,9 +2029,9 @@ static void 
BM_SM50_device_minimum_maximum_ssrgemm_nt_t_64x32x8_16x16x1_4x2_4x8_ using WarpShape = cutlass::gemm::GemmShape<16, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -2079,9 +2079,9 @@ static void BM_SM50_device_minimum_maximum_ssrgemm_nt_t_64x64x8_16x32x1_4x4_4x8_ using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -2129,9 +2129,9 @@ static void BM_SM50_device_minimum_maximum_ssrgemm_nt_t_128x32x8_32x16x1_4x4_8x4 using WarpShape = cutlass::gemm::GemmShape<32, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -2179,9 +2179,9 @@ static void 
BM_SM50_device_minimum_maximum_ssrgemm_nt_t_128x64x8_32x32x1_8x4_4x8 using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -2229,9 +2229,9 @@ static void BM_SM50_device_minimum_maximum_ssrgemm_nt_t_128x128x8_32x64x1_8x8_4x using WarpShape = cutlass::gemm::GemmShape<32, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -2279,9 +2279,9 @@ static void BM_SM50_device_minimum_maximum_ssrgemm_nt_t_256x32x8_64x16x1_8x4_8x4 using WarpShape = cutlass::gemm::GemmShape<64, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -2329,9 +2329,9 @@ static void 
BM_SM50_device_minimum_maximum_ssrgemm_nt_t_256x64x8_64x32x1_8x8_8x4 using WarpShape = cutlass::gemm::GemmShape<64, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -2379,9 +2379,9 @@ static void BM_SM50_device_minimum_maximum_ssrgemm_nt_t_32x64x16_8x16x1_2x2_4x8_ using WarpShape = cutlass::gemm::GemmShape<8, 16, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -2429,9 +2429,9 @@ static void BM_SM50_device_minimum_maximum_ssrgemm_nt_t_32x128x16_8x32x1_2x4_4x8 using WarpShape = cutlass::gemm::GemmShape<8, 32, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -2479,9 +2479,9 @@ static void 
BM_SM50_device_minimum_maximum_ssrgemm_nt_t_64x32x16_16x8x1_2x2_8x4_ using WarpShape = cutlass::gemm::GemmShape<16, 8, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -2529,9 +2529,9 @@ static void BM_SM50_device_minimum_maximum_ssrgemm_nt_t_64x64x8_16x16x1_4x2_4x8_ using WarpShape = cutlass::gemm::GemmShape<16, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -2579,9 +2579,9 @@ static void BM_SM50_device_minimum_maximum_ssrgemm_nt_t_64x128x8_16x32x1_4x4_4x8 using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -2629,9 +2629,9 @@ static void 
BM_SM50_device_minimum_maximum_ssrgemm_nt_t_64x256x8_16x64x1_4x8_4x8 using WarpShape = cutlass::gemm::GemmShape<16, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -2679,9 +2679,9 @@ static void BM_SM50_device_minimum_maximum_ssrgemm_nt_t_128x32x16_32x8x1_4x2_8x4 using WarpShape = cutlass::gemm::GemmShape<32, 8, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -2729,9 +2729,9 @@ static void BM_SM50_device_minimum_maximum_ssrgemm_nt_t_128x64x8_32x16x1_4x4_8x4 using WarpShape = cutlass::gemm::GemmShape<32, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -2779,9 +2779,9 @@ static void 
BM_SM50_device_minimum_maximum_ssrgemm_nt_t_128x128x8_32x32x1_8x4_4x using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -2829,9 +2829,9 @@ static void BM_SM50_device_minimum_maximum_ssrgemm_nt_t_256x64x8_64x16x1_8x4_8x4 using WarpShape = cutlass::gemm::GemmShape<64, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; diff --git a/bench/device/sm50_simt_minimum_maximum_ssrgemm_tn_n.cu b/bench/device/sm50_simt_minimum_maximum_ssrgemm_tn_n.cu index b5e1dd0..a3efbfb 100644 --- a/bench/device/sm50_simt_minimum_maximum_ssrgemm_tn_n.cu +++ b/bench/device/sm50_simt_minimum_maximum_ssrgemm_tn_n.cu @@ -29,9 +29,9 @@ static void BM_SM50_device_minimum_maximum_ssrgemm_tn_n_8x32x8_8x32x1_2x4_4x8_1x using WarpShape = cutlass::gemm::GemmShape<8, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename 
cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -79,9 +79,9 @@ static void BM_SM50_device_minimum_maximum_ssrgemm_tn_n_16x32x8_16x32x1_4x4_4x8_ using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -129,9 +129,9 @@ static void BM_SM50_device_minimum_maximum_ssrgemm_tn_n_16x64x8_16x64x1_4x8_4x8_ using WarpShape = cutlass::gemm::GemmShape<16, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -179,9 +179,9 @@ static void BM_SM50_device_minimum_maximum_ssrgemm_tn_n_32x32x8_32x32x1_8x4_4x8_ using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + 
precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -229,9 +229,9 @@ static void BM_SM50_device_minimum_maximum_ssrgemm_tn_n_32x64x8_32x64x1_8x8_4x8_ using WarpShape = cutlass::gemm::GemmShape<32, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -279,9 +279,9 @@ static void BM_SM50_device_minimum_maximum_ssrgemm_tn_n_64x32x8_64x32x1_8x8_8x4_ using WarpShape = cutlass::gemm::GemmShape<64, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -329,9 +329,9 @@ static void BM_SM50_device_minimum_maximum_ssrgemm_tn_n_8x32x8_8x16x1_2x2_4x8_1x using WarpShape = cutlass::gemm::GemmShape<8, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + 
cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -379,9 +379,9 @@ static void BM_SM50_device_minimum_maximum_ssrgemm_tn_n_8x64x8_8x32x1_2x4_4x8_1x using WarpShape = cutlass::gemm::GemmShape<8, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -429,9 +429,9 @@ static void BM_SM50_device_minimum_maximum_ssrgemm_tn_n_16x32x8_16x16x1_4x2_4x8_ using WarpShape = cutlass::gemm::GemmShape<16, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -479,9 +479,9 @@ static void BM_SM50_device_minimum_maximum_ssrgemm_tn_n_16x64x8_16x32x1_4x4_4x8_ using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using 
AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -529,9 +529,9 @@ static void BM_SM50_device_minimum_maximum_ssrgemm_tn_n_16x128x8_16x64x1_4x8_4x8 using WarpShape = cutlass::gemm::GemmShape<16, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -579,9 +579,9 @@ static void BM_SM50_device_minimum_maximum_ssrgemm_tn_n_32x32x8_32x16x1_4x4_8x4_ using WarpShape = cutlass::gemm::GemmShape<32, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -629,9 +629,9 @@ static void BM_SM50_device_minimum_maximum_ssrgemm_tn_n_32x64x8_32x32x1_8x4_4x8_ using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = 
Config::MultiplicationOp; @@ -679,9 +679,9 @@ static void BM_SM50_device_minimum_maximum_ssrgemm_tn_n_32x128x8_32x64x1_8x8_4x8 using WarpShape = cutlass::gemm::GemmShape<32, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -729,9 +729,9 @@ static void BM_SM50_device_minimum_maximum_ssrgemm_tn_n_64x64x8_64x32x1_8x8_8x4_ using WarpShape = cutlass::gemm::GemmShape<64, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -779,9 +779,9 @@ static void BM_SM50_device_minimum_maximum_ssrgemm_tn_n_32x32x8_16x32x1_4x4_4x8_ using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -829,9 +829,9 @@ static void 
BM_SM50_device_minimum_maximum_ssrgemm_tn_n_64x32x8_32x32x1_8x4_4x8_ using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -879,9 +879,9 @@ static void BM_SM50_device_minimum_maximum_ssrgemm_tn_n_64x64x8_32x64x1_8x8_4x8_ using WarpShape = cutlass::gemm::GemmShape<32, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -929,9 +929,9 @@ static void BM_SM50_device_minimum_maximum_ssrgemm_tn_n_128x32x8_64x32x1_8x8_8x4 using WarpShape = cutlass::gemm::GemmShape<64, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -979,9 +979,9 @@ static void 
BM_SM50_device_minimum_maximum_ssrgemm_tn_n_16x32x8_8x16x1_2x2_4x8_2 using WarpShape = cutlass::gemm::GemmShape<8, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1029,9 +1029,9 @@ static void BM_SM50_device_minimum_maximum_ssrgemm_tn_n_16x64x8_8x32x1_2x4_4x8_2 using WarpShape = cutlass::gemm::GemmShape<8, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1079,9 +1079,9 @@ static void BM_SM50_device_minimum_maximum_ssrgemm_tn_n_32x32x8_16x16x1_4x2_4x8_ using WarpShape = cutlass::gemm::GemmShape<16, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1129,9 +1129,9 @@ static void 
BM_SM50_device_minimum_maximum_ssrgemm_tn_n_32x64x8_16x32x1_4x4_4x8_ using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1179,9 +1179,9 @@ static void BM_SM50_device_minimum_maximum_ssrgemm_tn_n_32x128x8_16x64x1_4x8_4x8 using WarpShape = cutlass::gemm::GemmShape<16, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1229,9 +1229,9 @@ static void BM_SM50_device_minimum_maximum_ssrgemm_tn_n_64x32x8_32x16x1_4x4_8x4_ using WarpShape = cutlass::gemm::GemmShape<32, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1279,9 +1279,9 @@ static void 
BM_SM50_device_minimum_maximum_ssrgemm_tn_n_64x64x8_32x32x1_8x4_4x8_ using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1329,9 +1329,9 @@ static void BM_SM50_device_minimum_maximum_ssrgemm_tn_n_64x128x8_32x64x1_8x8_4x8 using WarpShape = cutlass::gemm::GemmShape<32, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1379,9 +1379,9 @@ static void BM_SM50_device_minimum_maximum_ssrgemm_tn_n_128x32x8_64x16x1_8x4_8x4 using WarpShape = cutlass::gemm::GemmShape<64, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1429,9 +1429,9 @@ static void 
BM_SM50_device_minimum_maximum_ssrgemm_tn_n_128x64x8_64x32x1_8x8_8x4 using WarpShape = cutlass::gemm::GemmShape<64, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1479,9 +1479,9 @@ static void BM_SM50_device_minimum_maximum_ssrgemm_tn_n_16x64x16_8x16x1_2x2_4x8_ using WarpShape = cutlass::gemm::GemmShape<8, 16, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1529,9 +1529,9 @@ static void BM_SM50_device_minimum_maximum_ssrgemm_tn_n_16x128x16_8x32x1_2x4_4x8 using WarpShape = cutlass::gemm::GemmShape<8, 32, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1579,9 +1579,9 @@ static void 
BM_SM50_device_minimum_maximum_ssrgemm_tn_n_32x32x8_16x8x1_2x2_8x4_2 using WarpShape = cutlass::gemm::GemmShape<16, 8, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1629,9 +1629,9 @@ static void BM_SM50_device_minimum_maximum_ssrgemm_tn_n_32x64x8_16x16x1_4x2_4x8_ using WarpShape = cutlass::gemm::GemmShape<16, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1679,9 +1679,9 @@ static void BM_SM50_device_minimum_maximum_ssrgemm_tn_n_32x128x8_16x32x1_4x4_4x8 using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1729,9 +1729,9 @@ static void 
BM_SM50_device_minimum_maximum_ssrgemm_tn_n_32x256x8_16x64x1_4x8_4x8 using WarpShape = cutlass::gemm::GemmShape<16, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1779,9 +1779,9 @@ static void BM_SM50_device_minimum_maximum_ssrgemm_tn_n_64x64x8_32x16x1_4x4_8x4_ using WarpShape = cutlass::gemm::GemmShape<32, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1829,9 +1829,9 @@ static void BM_SM50_device_minimum_maximum_ssrgemm_tn_n_64x128x8_32x32x1_8x4_4x8 using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1879,9 +1879,9 @@ static void 
BM_SM50_device_minimum_maximum_ssrgemm_tn_n_64x256x8_32x64x1_8x8_4x8 using WarpShape = cutlass::gemm::GemmShape<32, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1929,9 +1929,9 @@ static void BM_SM50_device_minimum_maximum_ssrgemm_tn_n_128x128x8_64x32x1_8x8_8x using WarpShape = cutlass::gemm::GemmShape<64, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1979,9 +1979,9 @@ static void BM_SM50_device_minimum_maximum_ssrgemm_tn_n_32x32x8_8x16x1_2x2_4x8_4 using WarpShape = cutlass::gemm::GemmShape<8, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -2029,9 +2029,9 @@ static void 
BM_SM50_device_minimum_maximum_ssrgemm_tn_n_64x32x8_16x16x1_4x2_4x8_ using WarpShape = cutlass::gemm::GemmShape<16, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -2079,9 +2079,9 @@ static void BM_SM50_device_minimum_maximum_ssrgemm_tn_n_64x64x8_16x32x1_4x4_4x8_ using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -2129,9 +2129,9 @@ static void BM_SM50_device_minimum_maximum_ssrgemm_tn_n_128x32x8_32x16x1_4x4_8x4 using WarpShape = cutlass::gemm::GemmShape<32, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -2179,9 +2179,9 @@ static void 
BM_SM50_device_minimum_maximum_ssrgemm_tn_n_128x64x8_32x32x1_8x4_4x8 using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -2229,9 +2229,9 @@ static void BM_SM50_device_minimum_maximum_ssrgemm_tn_n_128x128x8_32x64x1_8x8_4x using WarpShape = cutlass::gemm::GemmShape<32, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -2279,9 +2279,9 @@ static void BM_SM50_device_minimum_maximum_ssrgemm_tn_n_256x32x8_64x16x1_8x4_8x4 using WarpShape = cutlass::gemm::GemmShape<64, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -2329,9 +2329,9 @@ static void 
BM_SM50_device_minimum_maximum_ssrgemm_tn_n_256x64x8_64x32x1_8x8_8x4 using WarpShape = cutlass::gemm::GemmShape<64, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -2379,9 +2379,9 @@ static void BM_SM50_device_minimum_maximum_ssrgemm_tn_n_32x64x16_8x16x1_2x2_4x8_ using WarpShape = cutlass::gemm::GemmShape<8, 16, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -2429,9 +2429,9 @@ static void BM_SM50_device_minimum_maximum_ssrgemm_tn_n_32x128x16_8x32x1_2x4_4x8 using WarpShape = cutlass::gemm::GemmShape<8, 32, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -2479,9 +2479,9 @@ static void 
BM_SM50_device_minimum_maximum_ssrgemm_tn_n_64x32x16_16x8x1_2x2_8x4_ using WarpShape = cutlass::gemm::GemmShape<16, 8, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -2529,9 +2529,9 @@ static void BM_SM50_device_minimum_maximum_ssrgemm_tn_n_64x64x8_16x16x1_4x2_4x8_ using WarpShape = cutlass::gemm::GemmShape<16, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -2579,9 +2579,9 @@ static void BM_SM50_device_minimum_maximum_ssrgemm_tn_n_64x128x8_16x32x1_4x4_4x8 using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -2629,9 +2629,9 @@ static void 
BM_SM50_device_minimum_maximum_ssrgemm_tn_n_64x256x8_16x64x1_4x8_4x8 using WarpShape = cutlass::gemm::GemmShape<16, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -2679,9 +2679,9 @@ static void BM_SM50_device_minimum_maximum_ssrgemm_tn_n_128x32x16_32x8x1_4x2_8x4 using WarpShape = cutlass::gemm::GemmShape<32, 8, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -2729,9 +2729,9 @@ static void BM_SM50_device_minimum_maximum_ssrgemm_tn_n_128x64x8_32x16x1_4x4_8x4 using WarpShape = cutlass::gemm::GemmShape<32, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -2779,9 +2779,9 @@ static void 
BM_SM50_device_minimum_maximum_ssrgemm_tn_n_128x128x8_32x32x1_8x4_4x using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -2829,9 +2829,9 @@ static void BM_SM50_device_minimum_maximum_ssrgemm_tn_n_256x64x8_64x16x1_8x4_8x4 using WarpShape = cutlass::gemm::GemmShape<64, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; diff --git a/bench/device/sm50_simt_minimum_maximum_ssrgemm_tn_t.cu b/bench/device/sm50_simt_minimum_maximum_ssrgemm_tn_t.cu index 00ad4c6..4bcafc7 100644 --- a/bench/device/sm50_simt_minimum_maximum_ssrgemm_tn_t.cu +++ b/bench/device/sm50_simt_minimum_maximum_ssrgemm_tn_t.cu @@ -29,9 +29,9 @@ static void BM_SM50_device_minimum_maximum_ssrgemm_tn_t_8x32x8_8x32x1_2x4_4x8_1x using WarpShape = cutlass::gemm::GemmShape<8, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename 
cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -79,9 +79,9 @@ static void BM_SM50_device_minimum_maximum_ssrgemm_tn_t_16x32x8_16x32x1_4x4_4x8_ using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -129,9 +129,9 @@ static void BM_SM50_device_minimum_maximum_ssrgemm_tn_t_16x64x8_16x64x1_4x8_4x8_ using WarpShape = cutlass::gemm::GemmShape<16, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -179,9 +179,9 @@ static void BM_SM50_device_minimum_maximum_ssrgemm_tn_t_32x32x8_32x32x1_8x4_4x8_ using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + 
precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -229,9 +229,9 @@ static void BM_SM50_device_minimum_maximum_ssrgemm_tn_t_32x64x8_32x64x1_8x8_4x8_ using WarpShape = cutlass::gemm::GemmShape<32, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -279,9 +279,9 @@ static void BM_SM50_device_minimum_maximum_ssrgemm_tn_t_64x32x8_64x32x1_8x8_8x4_ using WarpShape = cutlass::gemm::GemmShape<64, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -329,9 +329,9 @@ static void BM_SM50_device_minimum_maximum_ssrgemm_tn_t_8x32x8_8x16x1_2x2_4x8_1x using WarpShape = cutlass::gemm::GemmShape<8, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + 
cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -379,9 +379,9 @@ static void BM_SM50_device_minimum_maximum_ssrgemm_tn_t_8x64x8_8x32x1_2x4_4x8_1x using WarpShape = cutlass::gemm::GemmShape<8, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -429,9 +429,9 @@ static void BM_SM50_device_minimum_maximum_ssrgemm_tn_t_16x32x8_16x16x1_4x2_4x8_ using WarpShape = cutlass::gemm::GemmShape<16, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -479,9 +479,9 @@ static void BM_SM50_device_minimum_maximum_ssrgemm_tn_t_16x64x8_16x32x1_4x4_4x8_ using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using 
AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -529,9 +529,9 @@ static void BM_SM50_device_minimum_maximum_ssrgemm_tn_t_16x128x8_16x64x1_4x8_4x8 using WarpShape = cutlass::gemm::GemmShape<16, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -579,9 +579,9 @@ static void BM_SM50_device_minimum_maximum_ssrgemm_tn_t_32x32x8_32x16x1_4x4_8x4_ using WarpShape = cutlass::gemm::GemmShape<32, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -629,9 +629,9 @@ static void BM_SM50_device_minimum_maximum_ssrgemm_tn_t_32x64x8_32x32x1_8x4_4x8_ using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = 
Config::MultiplicationOp; @@ -679,9 +679,9 @@ static void BM_SM50_device_minimum_maximum_ssrgemm_tn_t_32x128x8_32x64x1_8x8_4x8 using WarpShape = cutlass::gemm::GemmShape<32, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -729,9 +729,9 @@ static void BM_SM50_device_minimum_maximum_ssrgemm_tn_t_64x64x8_64x32x1_8x8_8x4_ using WarpShape = cutlass::gemm::GemmShape<64, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -779,9 +779,9 @@ static void BM_SM50_device_minimum_maximum_ssrgemm_tn_t_32x32x8_16x32x1_4x4_4x8_ using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -829,9 +829,9 @@ static void 
BM_SM50_device_minimum_maximum_ssrgemm_tn_t_64x32x8_32x32x1_8x4_4x8_ using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -879,9 +879,9 @@ static void BM_SM50_device_minimum_maximum_ssrgemm_tn_t_64x64x8_32x64x1_8x8_4x8_ using WarpShape = cutlass::gemm::GemmShape<32, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -929,9 +929,9 @@ static void BM_SM50_device_minimum_maximum_ssrgemm_tn_t_128x32x8_64x32x1_8x8_8x4 using WarpShape = cutlass::gemm::GemmShape<64, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -979,9 +979,9 @@ static void 
BM_SM50_device_minimum_maximum_ssrgemm_tn_t_16x32x8_8x16x1_2x2_4x8_2 using WarpShape = cutlass::gemm::GemmShape<8, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1029,9 +1029,9 @@ static void BM_SM50_device_minimum_maximum_ssrgemm_tn_t_16x64x8_8x32x1_2x4_4x8_2 using WarpShape = cutlass::gemm::GemmShape<8, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1079,9 +1079,9 @@ static void BM_SM50_device_minimum_maximum_ssrgemm_tn_t_32x32x8_16x16x1_4x2_4x8_ using WarpShape = cutlass::gemm::GemmShape<16, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1129,9 +1129,9 @@ static void 
BM_SM50_device_minimum_maximum_ssrgemm_tn_t_32x64x8_16x32x1_4x4_4x8_ using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1179,9 +1179,9 @@ static void BM_SM50_device_minimum_maximum_ssrgemm_tn_t_32x128x8_16x64x1_4x8_4x8 using WarpShape = cutlass::gemm::GemmShape<16, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1229,9 +1229,9 @@ static void BM_SM50_device_minimum_maximum_ssrgemm_tn_t_64x32x8_32x16x1_4x4_8x4_ using WarpShape = cutlass::gemm::GemmShape<32, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1279,9 +1279,9 @@ static void 
BM_SM50_device_minimum_maximum_ssrgemm_tn_t_64x64x8_32x32x1_8x4_4x8_ using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1329,9 +1329,9 @@ static void BM_SM50_device_minimum_maximum_ssrgemm_tn_t_64x128x8_32x64x1_8x8_4x8 using WarpShape = cutlass::gemm::GemmShape<32, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1379,9 +1379,9 @@ static void BM_SM50_device_minimum_maximum_ssrgemm_tn_t_128x32x8_64x16x1_8x4_8x4 using WarpShape = cutlass::gemm::GemmShape<64, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1429,9 +1429,9 @@ static void 
BM_SM50_device_minimum_maximum_ssrgemm_tn_t_128x64x8_64x32x1_8x8_8x4 using WarpShape = cutlass::gemm::GemmShape<64, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1479,9 +1479,9 @@ static void BM_SM50_device_minimum_maximum_ssrgemm_tn_t_16x64x16_8x16x1_2x2_4x8_ using WarpShape = cutlass::gemm::GemmShape<8, 16, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1529,9 +1529,9 @@ static void BM_SM50_device_minimum_maximum_ssrgemm_tn_t_16x128x16_8x32x1_2x4_4x8 using WarpShape = cutlass::gemm::GemmShape<8, 32, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1579,9 +1579,9 @@ static void 
BM_SM50_device_minimum_maximum_ssrgemm_tn_t_32x32x8_16x8x1_2x2_8x4_2 using WarpShape = cutlass::gemm::GemmShape<16, 8, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1629,9 +1629,9 @@ static void BM_SM50_device_minimum_maximum_ssrgemm_tn_t_32x64x8_16x16x1_4x2_4x8_ using WarpShape = cutlass::gemm::GemmShape<16, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1679,9 +1679,9 @@ static void BM_SM50_device_minimum_maximum_ssrgemm_tn_t_32x128x8_16x32x1_4x4_4x8 using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1729,9 +1729,9 @@ static void 
BM_SM50_device_minimum_maximum_ssrgemm_tn_t_32x256x8_16x64x1_4x8_4x8 using WarpShape = cutlass::gemm::GemmShape<16, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1779,9 +1779,9 @@ static void BM_SM50_device_minimum_maximum_ssrgemm_tn_t_64x64x8_32x16x1_4x4_8x4_ using WarpShape = cutlass::gemm::GemmShape<32, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1829,9 +1829,9 @@ static void BM_SM50_device_minimum_maximum_ssrgemm_tn_t_64x128x8_32x32x1_8x4_4x8 using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1879,9 +1879,9 @@ static void 
BM_SM50_device_minimum_maximum_ssrgemm_tn_t_64x256x8_32x64x1_8x8_4x8 using WarpShape = cutlass::gemm::GemmShape<32, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1929,9 +1929,9 @@ static void BM_SM50_device_minimum_maximum_ssrgemm_tn_t_128x128x8_64x32x1_8x8_8x using WarpShape = cutlass::gemm::GemmShape<64, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1979,9 +1979,9 @@ static void BM_SM50_device_minimum_maximum_ssrgemm_tn_t_32x32x8_8x16x1_2x2_4x8_4 using WarpShape = cutlass::gemm::GemmShape<8, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -2029,9 +2029,9 @@ static void 
BM_SM50_device_minimum_maximum_ssrgemm_tn_t_64x32x8_16x16x1_4x2_4x8_ using WarpShape = cutlass::gemm::GemmShape<16, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -2079,9 +2079,9 @@ static void BM_SM50_device_minimum_maximum_ssrgemm_tn_t_64x64x8_16x32x1_4x4_4x8_ using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -2129,9 +2129,9 @@ static void BM_SM50_device_minimum_maximum_ssrgemm_tn_t_128x32x8_32x16x1_4x4_8x4 using WarpShape = cutlass::gemm::GemmShape<32, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -2179,9 +2179,9 @@ static void 
BM_SM50_device_minimum_maximum_ssrgemm_tn_t_128x64x8_32x32x1_8x4_4x8 using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -2229,9 +2229,9 @@ static void BM_SM50_device_minimum_maximum_ssrgemm_tn_t_128x128x8_32x64x1_8x8_4x using WarpShape = cutlass::gemm::GemmShape<32, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -2279,9 +2279,9 @@ static void BM_SM50_device_minimum_maximum_ssrgemm_tn_t_256x32x8_64x16x1_8x4_8x4 using WarpShape = cutlass::gemm::GemmShape<64, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -2329,9 +2329,9 @@ static void 
BM_SM50_device_minimum_maximum_ssrgemm_tn_t_256x64x8_64x32x1_8x8_8x4 using WarpShape = cutlass::gemm::GemmShape<64, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -2379,9 +2379,9 @@ static void BM_SM50_device_minimum_maximum_ssrgemm_tn_t_32x64x16_8x16x1_2x2_4x8_ using WarpShape = cutlass::gemm::GemmShape<8, 16, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -2429,9 +2429,9 @@ static void BM_SM50_device_minimum_maximum_ssrgemm_tn_t_32x128x16_8x32x1_2x4_4x8 using WarpShape = cutlass::gemm::GemmShape<8, 32, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -2479,9 +2479,9 @@ static void 
BM_SM50_device_minimum_maximum_ssrgemm_tn_t_64x32x16_16x8x1_2x2_8x4_ using WarpShape = cutlass::gemm::GemmShape<16, 8, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -2529,9 +2529,9 @@ static void BM_SM50_device_minimum_maximum_ssrgemm_tn_t_64x64x8_16x16x1_4x2_4x8_ using WarpShape = cutlass::gemm::GemmShape<16, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -2579,9 +2579,9 @@ static void BM_SM50_device_minimum_maximum_ssrgemm_tn_t_64x128x8_16x32x1_4x4_4x8 using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -2629,9 +2629,9 @@ static void 
BM_SM50_device_minimum_maximum_ssrgemm_tn_t_64x256x8_16x64x1_4x8_4x8 using WarpShape = cutlass::gemm::GemmShape<16, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -2679,9 +2679,9 @@ static void BM_SM50_device_minimum_maximum_ssrgemm_tn_t_128x32x16_32x8x1_4x2_8x4 using WarpShape = cutlass::gemm::GemmShape<32, 8, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -2729,9 +2729,9 @@ static void BM_SM50_device_minimum_maximum_ssrgemm_tn_t_128x64x8_32x16x1_4x4_8x4 using WarpShape = cutlass::gemm::GemmShape<32, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -2779,9 +2779,9 @@ static void 
BM_SM50_device_minimum_maximum_ssrgemm_tn_t_128x128x8_32x32x1_8x4_4x using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -2829,9 +2829,9 @@ static void BM_SM50_device_minimum_maximum_ssrgemm_tn_t_256x64x8_64x16x1_8x4_8x4 using WarpShape = cutlass::gemm::GemmShape<64, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; diff --git a/bench/device/sm50_simt_minimum_maximum_ssrgemm_tt_n.cu b/bench/device/sm50_simt_minimum_maximum_ssrgemm_tt_n.cu index 7676bf6..c811be7 100644 --- a/bench/device/sm50_simt_minimum_maximum_ssrgemm_tt_n.cu +++ b/bench/device/sm50_simt_minimum_maximum_ssrgemm_tt_n.cu @@ -29,9 +29,9 @@ static void BM_SM50_device_minimum_maximum_ssrgemm_tt_n_8x32x8_8x32x1_2x4_4x8_1x using WarpShape = cutlass::gemm::GemmShape<8, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename 
cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -79,9 +79,9 @@ static void BM_SM50_device_minimum_maximum_ssrgemm_tt_n_16x32x8_16x32x1_4x4_4x8_ using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -129,9 +129,9 @@ static void BM_SM50_device_minimum_maximum_ssrgemm_tt_n_16x64x8_16x64x1_4x8_4x8_ using WarpShape = cutlass::gemm::GemmShape<16, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -179,9 +179,9 @@ static void BM_SM50_device_minimum_maximum_ssrgemm_tt_n_32x32x8_32x32x1_8x4_4x8_ using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + 
precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -229,9 +229,9 @@ static void BM_SM50_device_minimum_maximum_ssrgemm_tt_n_32x64x8_32x64x1_8x8_4x8_ using WarpShape = cutlass::gemm::GemmShape<32, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -279,9 +279,9 @@ static void BM_SM50_device_minimum_maximum_ssrgemm_tt_n_64x32x8_64x32x1_8x8_8x4_ using WarpShape = cutlass::gemm::GemmShape<64, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -329,9 +329,9 @@ static void BM_SM50_device_minimum_maximum_ssrgemm_tt_n_8x32x8_8x16x1_2x2_4x8_1x using WarpShape = cutlass::gemm::GemmShape<8, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + 
cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -379,9 +379,9 @@ static void BM_SM50_device_minimum_maximum_ssrgemm_tt_n_8x64x8_8x32x1_2x4_4x8_1x using WarpShape = cutlass::gemm::GemmShape<8, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -429,9 +429,9 @@ static void BM_SM50_device_minimum_maximum_ssrgemm_tt_n_16x32x8_16x16x1_4x2_4x8_ using WarpShape = cutlass::gemm::GemmShape<16, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -479,9 +479,9 @@ static void BM_SM50_device_minimum_maximum_ssrgemm_tt_n_16x64x8_16x32x1_4x4_4x8_ using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using 
AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -529,9 +529,9 @@ static void BM_SM50_device_minimum_maximum_ssrgemm_tt_n_16x128x8_16x64x1_4x8_4x8 using WarpShape = cutlass::gemm::GemmShape<16, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -579,9 +579,9 @@ static void BM_SM50_device_minimum_maximum_ssrgemm_tt_n_32x32x8_32x16x1_4x4_8x4_ using WarpShape = cutlass::gemm::GemmShape<32, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -629,9 +629,9 @@ static void BM_SM50_device_minimum_maximum_ssrgemm_tt_n_32x64x8_32x32x1_8x4_4x8_ using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = 
Config::MultiplicationOp; @@ -679,9 +679,9 @@ static void BM_SM50_device_minimum_maximum_ssrgemm_tt_n_32x128x8_32x64x1_8x8_4x8 using WarpShape = cutlass::gemm::GemmShape<32, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -729,9 +729,9 @@ static void BM_SM50_device_minimum_maximum_ssrgemm_tt_n_64x64x8_64x32x1_8x8_8x4_ using WarpShape = cutlass::gemm::GemmShape<64, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -779,9 +779,9 @@ static void BM_SM50_device_minimum_maximum_ssrgemm_tt_n_32x32x8_16x32x1_4x4_4x8_ using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -829,9 +829,9 @@ static void 
BM_SM50_device_minimum_maximum_ssrgemm_tt_n_64x32x8_32x32x1_8x4_4x8_ using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -879,9 +879,9 @@ static void BM_SM50_device_minimum_maximum_ssrgemm_tt_n_64x64x8_32x64x1_8x8_4x8_ using WarpShape = cutlass::gemm::GemmShape<32, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -929,9 +929,9 @@ static void BM_SM50_device_minimum_maximum_ssrgemm_tt_n_128x32x8_64x32x1_8x8_8x4 using WarpShape = cutlass::gemm::GemmShape<64, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -979,9 +979,9 @@ static void 
BM_SM50_device_minimum_maximum_ssrgemm_tt_n_16x32x8_8x16x1_2x2_4x8_2 using WarpShape = cutlass::gemm::GemmShape<8, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1029,9 +1029,9 @@ static void BM_SM50_device_minimum_maximum_ssrgemm_tt_n_16x64x8_8x32x1_2x4_4x8_2 using WarpShape = cutlass::gemm::GemmShape<8, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1079,9 +1079,9 @@ static void BM_SM50_device_minimum_maximum_ssrgemm_tt_n_32x32x8_16x16x1_4x2_4x8_ using WarpShape = cutlass::gemm::GemmShape<16, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1129,9 +1129,9 @@ static void 
BM_SM50_device_minimum_maximum_ssrgemm_tt_n_32x64x8_16x32x1_4x4_4x8_ using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1179,9 +1179,9 @@ static void BM_SM50_device_minimum_maximum_ssrgemm_tt_n_32x128x8_16x64x1_4x8_4x8 using WarpShape = cutlass::gemm::GemmShape<16, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1229,9 +1229,9 @@ static void BM_SM50_device_minimum_maximum_ssrgemm_tt_n_64x32x8_32x16x1_4x4_8x4_ using WarpShape = cutlass::gemm::GemmShape<32, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1279,9 +1279,9 @@ static void 
BM_SM50_device_minimum_maximum_ssrgemm_tt_n_64x64x8_32x32x1_8x4_4x8_ using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1329,9 +1329,9 @@ static void BM_SM50_device_minimum_maximum_ssrgemm_tt_n_64x128x8_32x64x1_8x8_4x8 using WarpShape = cutlass::gemm::GemmShape<32, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1379,9 +1379,9 @@ static void BM_SM50_device_minimum_maximum_ssrgemm_tt_n_128x32x8_64x16x1_8x4_8x4 using WarpShape = cutlass::gemm::GemmShape<64, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1429,9 +1429,9 @@ static void 
BM_SM50_device_minimum_maximum_ssrgemm_tt_n_128x64x8_64x32x1_8x8_8x4 using WarpShape = cutlass::gemm::GemmShape<64, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1479,9 +1479,9 @@ static void BM_SM50_device_minimum_maximum_ssrgemm_tt_n_16x64x16_8x16x1_2x2_4x8_ using WarpShape = cutlass::gemm::GemmShape<8, 16, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1529,9 +1529,9 @@ static void BM_SM50_device_minimum_maximum_ssrgemm_tt_n_16x128x16_8x32x1_2x4_4x8 using WarpShape = cutlass::gemm::GemmShape<8, 32, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1579,9 +1579,9 @@ static void 
BM_SM50_device_minimum_maximum_ssrgemm_tt_n_32x32x8_16x8x1_2x2_8x4_2 using WarpShape = cutlass::gemm::GemmShape<16, 8, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1629,9 +1629,9 @@ static void BM_SM50_device_minimum_maximum_ssrgemm_tt_n_32x64x8_16x16x1_4x2_4x8_ using WarpShape = cutlass::gemm::GemmShape<16, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1679,9 +1679,9 @@ static void BM_SM50_device_minimum_maximum_ssrgemm_tt_n_32x128x8_16x32x1_4x4_4x8 using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1729,9 +1729,9 @@ static void 
BM_SM50_device_minimum_maximum_ssrgemm_tt_n_32x256x8_16x64x1_4x8_4x8 using WarpShape = cutlass::gemm::GemmShape<16, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1779,9 +1779,9 @@ static void BM_SM50_device_minimum_maximum_ssrgemm_tt_n_64x64x8_32x16x1_4x4_8x4_ using WarpShape = cutlass::gemm::GemmShape<32, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1829,9 +1829,9 @@ static void BM_SM50_device_minimum_maximum_ssrgemm_tt_n_64x128x8_32x32x1_8x4_4x8 using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1879,9 +1879,9 @@ static void 
BM_SM50_device_minimum_maximum_ssrgemm_tt_n_64x256x8_32x64x1_8x8_4x8 using WarpShape = cutlass::gemm::GemmShape<32, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1929,9 +1929,9 @@ static void BM_SM50_device_minimum_maximum_ssrgemm_tt_n_128x128x8_64x32x1_8x8_8x using WarpShape = cutlass::gemm::GemmShape<64, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1979,9 +1979,9 @@ static void BM_SM50_device_minimum_maximum_ssrgemm_tt_n_32x32x8_8x16x1_2x2_4x8_4 using WarpShape = cutlass::gemm::GemmShape<8, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -2029,9 +2029,9 @@ static void 
BM_SM50_device_minimum_maximum_ssrgemm_tt_n_64x32x8_16x16x1_4x2_4x8_ using WarpShape = cutlass::gemm::GemmShape<16, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -2079,9 +2079,9 @@ static void BM_SM50_device_minimum_maximum_ssrgemm_tt_n_64x64x8_16x32x1_4x4_4x8_ using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -2129,9 +2129,9 @@ static void BM_SM50_device_minimum_maximum_ssrgemm_tt_n_128x32x8_32x16x1_4x4_8x4 using WarpShape = cutlass::gemm::GemmShape<32, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -2179,9 +2179,9 @@ static void 
BM_SM50_device_minimum_maximum_ssrgemm_tt_n_128x64x8_32x32x1_8x4_4x8 using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -2229,9 +2229,9 @@ static void BM_SM50_device_minimum_maximum_ssrgemm_tt_n_128x128x8_32x64x1_8x8_4x using WarpShape = cutlass::gemm::GemmShape<32, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -2279,9 +2279,9 @@ static void BM_SM50_device_minimum_maximum_ssrgemm_tt_n_256x32x8_64x16x1_8x4_8x4 using WarpShape = cutlass::gemm::GemmShape<64, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -2329,9 +2329,9 @@ static void 
BM_SM50_device_minimum_maximum_ssrgemm_tt_n_256x64x8_64x32x1_8x8_8x4 using WarpShape = cutlass::gemm::GemmShape<64, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -2379,9 +2379,9 @@ static void BM_SM50_device_minimum_maximum_ssrgemm_tt_n_32x64x16_8x16x1_2x2_4x8_ using WarpShape = cutlass::gemm::GemmShape<8, 16, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -2429,9 +2429,9 @@ static void BM_SM50_device_minimum_maximum_ssrgemm_tt_n_32x128x16_8x32x1_2x4_4x8 using WarpShape = cutlass::gemm::GemmShape<8, 32, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -2479,9 +2479,9 @@ static void 
BM_SM50_device_minimum_maximum_ssrgemm_tt_n_64x32x16_16x8x1_2x2_8x4_ using WarpShape = cutlass::gemm::GemmShape<16, 8, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -2529,9 +2529,9 @@ static void BM_SM50_device_minimum_maximum_ssrgemm_tt_n_64x64x8_16x16x1_4x2_4x8_ using WarpShape = cutlass::gemm::GemmShape<16, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -2579,9 +2579,9 @@ static void BM_SM50_device_minimum_maximum_ssrgemm_tt_n_64x128x8_16x32x1_4x4_4x8 using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -2629,9 +2629,9 @@ static void 
BM_SM50_device_minimum_maximum_ssrgemm_tt_n_64x256x8_16x64x1_4x8_4x8 using WarpShape = cutlass::gemm::GemmShape<16, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -2679,9 +2679,9 @@ static void BM_SM50_device_minimum_maximum_ssrgemm_tt_n_128x32x16_32x8x1_4x2_8x4 using WarpShape = cutlass::gemm::GemmShape<32, 8, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -2729,9 +2729,9 @@ static void BM_SM50_device_minimum_maximum_ssrgemm_tt_n_128x64x8_32x16x1_4x4_8x4 using WarpShape = cutlass::gemm::GemmShape<32, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -2779,9 +2779,9 @@ static void 
BM_SM50_device_minimum_maximum_ssrgemm_tt_n_128x128x8_32x32x1_8x4_4x using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -2829,9 +2829,9 @@ static void BM_SM50_device_minimum_maximum_ssrgemm_tt_n_256x64x8_64x16x1_8x4_8x4 using WarpShape = cutlass::gemm::GemmShape<64, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; diff --git a/bench/device/sm50_simt_minimum_maximum_ssrgemm_tt_t.cu b/bench/device/sm50_simt_minimum_maximum_ssrgemm_tt_t.cu index 01f8575..b4472b8 100644 --- a/bench/device/sm50_simt_minimum_maximum_ssrgemm_tt_t.cu +++ b/bench/device/sm50_simt_minimum_maximum_ssrgemm_tt_t.cu @@ -29,9 +29,9 @@ static void BM_SM50_device_minimum_maximum_ssrgemm_tt_t_8x32x8_8x32x1_2x4_4x8_1x using WarpShape = cutlass::gemm::GemmShape<8, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename 
cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -79,9 +79,9 @@ static void BM_SM50_device_minimum_maximum_ssrgemm_tt_t_16x32x8_16x32x1_4x4_4x8_ using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -129,9 +129,9 @@ static void BM_SM50_device_minimum_maximum_ssrgemm_tt_t_16x64x8_16x64x1_4x8_4x8_ using WarpShape = cutlass::gemm::GemmShape<16, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -179,9 +179,9 @@ static void BM_SM50_device_minimum_maximum_ssrgemm_tt_t_32x32x8_32x32x1_8x4_4x8_ using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + 
precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -229,9 +229,9 @@ static void BM_SM50_device_minimum_maximum_ssrgemm_tt_t_32x64x8_32x64x1_8x8_4x8_ using WarpShape = cutlass::gemm::GemmShape<32, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -279,9 +279,9 @@ static void BM_SM50_device_minimum_maximum_ssrgemm_tt_t_64x32x8_64x32x1_8x8_8x4_ using WarpShape = cutlass::gemm::GemmShape<64, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -329,9 +329,9 @@ static void BM_SM50_device_minimum_maximum_ssrgemm_tt_t_8x32x8_8x16x1_2x2_4x8_1x using WarpShape = cutlass::gemm::GemmShape<8, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + 
cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -379,9 +379,9 @@ static void BM_SM50_device_minimum_maximum_ssrgemm_tt_t_8x64x8_8x32x1_2x4_4x8_1x using WarpShape = cutlass::gemm::GemmShape<8, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -429,9 +429,9 @@ static void BM_SM50_device_minimum_maximum_ssrgemm_tt_t_16x32x8_16x16x1_4x2_4x8_ using WarpShape = cutlass::gemm::GemmShape<16, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -479,9 +479,9 @@ static void BM_SM50_device_minimum_maximum_ssrgemm_tt_t_16x64x8_16x32x1_4x4_4x8_ using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using 
AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -529,9 +529,9 @@ static void BM_SM50_device_minimum_maximum_ssrgemm_tt_t_16x128x8_16x64x1_4x8_4x8 using WarpShape = cutlass::gemm::GemmShape<16, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -579,9 +579,9 @@ static void BM_SM50_device_minimum_maximum_ssrgemm_tt_t_32x32x8_32x16x1_4x4_8x4_ using WarpShape = cutlass::gemm::GemmShape<32, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -629,9 +629,9 @@ static void BM_SM50_device_minimum_maximum_ssrgemm_tt_t_32x64x8_32x32x1_8x4_4x8_ using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = 
Config::MultiplicationOp; @@ -679,9 +679,9 @@ static void BM_SM50_device_minimum_maximum_ssrgemm_tt_t_32x128x8_32x64x1_8x8_4x8 using WarpShape = cutlass::gemm::GemmShape<32, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -729,9 +729,9 @@ static void BM_SM50_device_minimum_maximum_ssrgemm_tt_t_64x64x8_64x32x1_8x8_8x4_ using WarpShape = cutlass::gemm::GemmShape<64, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -779,9 +779,9 @@ static void BM_SM50_device_minimum_maximum_ssrgemm_tt_t_32x32x8_16x32x1_4x4_4x8_ using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -829,9 +829,9 @@ static void 
BM_SM50_device_minimum_maximum_ssrgemm_tt_t_64x32x8_32x32x1_8x4_4x8_ using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -879,9 +879,9 @@ static void BM_SM50_device_minimum_maximum_ssrgemm_tt_t_64x64x8_32x64x1_8x8_4x8_ using WarpShape = cutlass::gemm::GemmShape<32, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -929,9 +929,9 @@ static void BM_SM50_device_minimum_maximum_ssrgemm_tt_t_128x32x8_64x32x1_8x8_8x4 using WarpShape = cutlass::gemm::GemmShape<64, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -979,9 +979,9 @@ static void 
BM_SM50_device_minimum_maximum_ssrgemm_tt_t_16x32x8_8x16x1_2x2_4x8_2 using WarpShape = cutlass::gemm::GemmShape<8, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1029,9 +1029,9 @@ static void BM_SM50_device_minimum_maximum_ssrgemm_tt_t_16x64x8_8x32x1_2x4_4x8_2 using WarpShape = cutlass::gemm::GemmShape<8, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1079,9 +1079,9 @@ static void BM_SM50_device_minimum_maximum_ssrgemm_tt_t_32x32x8_16x16x1_4x2_4x8_ using WarpShape = cutlass::gemm::GemmShape<16, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1129,9 +1129,9 @@ static void 
BM_SM50_device_minimum_maximum_ssrgemm_tt_t_32x64x8_16x32x1_4x4_4x8_ using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1179,9 +1179,9 @@ static void BM_SM50_device_minimum_maximum_ssrgemm_tt_t_32x128x8_16x64x1_4x8_4x8 using WarpShape = cutlass::gemm::GemmShape<16, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1229,9 +1229,9 @@ static void BM_SM50_device_minimum_maximum_ssrgemm_tt_t_64x32x8_32x16x1_4x4_8x4_ using WarpShape = cutlass::gemm::GemmShape<32, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1279,9 +1279,9 @@ static void 
BM_SM50_device_minimum_maximum_ssrgemm_tt_t_64x64x8_32x32x1_8x4_4x8_ using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1329,9 +1329,9 @@ static void BM_SM50_device_minimum_maximum_ssrgemm_tt_t_64x128x8_32x64x1_8x8_4x8 using WarpShape = cutlass::gemm::GemmShape<32, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1379,9 +1379,9 @@ static void BM_SM50_device_minimum_maximum_ssrgemm_tt_t_128x32x8_64x16x1_8x4_8x4 using WarpShape = cutlass::gemm::GemmShape<64, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1429,9 +1429,9 @@ static void 
BM_SM50_device_minimum_maximum_ssrgemm_tt_t_128x64x8_64x32x1_8x8_8x4 using WarpShape = cutlass::gemm::GemmShape<64, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1479,9 +1479,9 @@ static void BM_SM50_device_minimum_maximum_ssrgemm_tt_t_16x64x16_8x16x1_2x2_4x8_ using WarpShape = cutlass::gemm::GemmShape<8, 16, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1529,9 +1529,9 @@ static void BM_SM50_device_minimum_maximum_ssrgemm_tt_t_16x128x16_8x32x1_2x4_4x8 using WarpShape = cutlass::gemm::GemmShape<8, 32, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1579,9 +1579,9 @@ static void 
BM_SM50_device_minimum_maximum_ssrgemm_tt_t_32x32x8_16x8x1_2x2_8x4_2 using WarpShape = cutlass::gemm::GemmShape<16, 8, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1629,9 +1629,9 @@ static void BM_SM50_device_minimum_maximum_ssrgemm_tt_t_32x64x8_16x16x1_4x2_4x8_ using WarpShape = cutlass::gemm::GemmShape<16, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1679,9 +1679,9 @@ static void BM_SM50_device_minimum_maximum_ssrgemm_tt_t_32x128x8_16x32x1_4x4_4x8 using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1729,9 +1729,9 @@ static void 
BM_SM50_device_minimum_maximum_ssrgemm_tt_t_32x256x8_16x64x1_4x8_4x8 using WarpShape = cutlass::gemm::GemmShape<16, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1779,9 +1779,9 @@ static void BM_SM50_device_minimum_maximum_ssrgemm_tt_t_64x64x8_32x16x1_4x4_8x4_ using WarpShape = cutlass::gemm::GemmShape<32, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1829,9 +1829,9 @@ static void BM_SM50_device_minimum_maximum_ssrgemm_tt_t_64x128x8_32x32x1_8x4_4x8 using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1879,9 +1879,9 @@ static void 
BM_SM50_device_minimum_maximum_ssrgemm_tt_t_64x256x8_32x64x1_8x8_4x8 using WarpShape = cutlass::gemm::GemmShape<32, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1929,9 +1929,9 @@ static void BM_SM50_device_minimum_maximum_ssrgemm_tt_t_128x128x8_64x32x1_8x8_8x using WarpShape = cutlass::gemm::GemmShape<64, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1979,9 +1979,9 @@ static void BM_SM50_device_minimum_maximum_ssrgemm_tt_t_32x32x8_8x16x1_2x2_4x8_4 using WarpShape = cutlass::gemm::GemmShape<8, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -2029,9 +2029,9 @@ static void 
BM_SM50_device_minimum_maximum_ssrgemm_tt_t_64x32x8_16x16x1_4x2_4x8_ using WarpShape = cutlass::gemm::GemmShape<16, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -2079,9 +2079,9 @@ static void BM_SM50_device_minimum_maximum_ssrgemm_tt_t_64x64x8_16x32x1_4x4_4x8_ using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -2129,9 +2129,9 @@ static void BM_SM50_device_minimum_maximum_ssrgemm_tt_t_128x32x8_32x16x1_4x4_8x4 using WarpShape = cutlass::gemm::GemmShape<32, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -2179,9 +2179,9 @@ static void 
BM_SM50_device_minimum_maximum_ssrgemm_tt_t_128x64x8_32x32x1_8x4_4x8 using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -2229,9 +2229,9 @@ static void BM_SM50_device_minimum_maximum_ssrgemm_tt_t_128x128x8_32x64x1_8x8_4x using WarpShape = cutlass::gemm::GemmShape<32, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -2279,9 +2279,9 @@ static void BM_SM50_device_minimum_maximum_ssrgemm_tt_t_256x32x8_64x16x1_8x4_8x4 using WarpShape = cutlass::gemm::GemmShape<64, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -2329,9 +2329,9 @@ static void 
BM_SM50_device_minimum_maximum_ssrgemm_tt_t_256x64x8_64x32x1_8x8_8x4 using WarpShape = cutlass::gemm::GemmShape<64, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -2379,9 +2379,9 @@ static void BM_SM50_device_minimum_maximum_ssrgemm_tt_t_32x64x16_8x16x1_2x2_4x8_ using WarpShape = cutlass::gemm::GemmShape<8, 16, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -2429,9 +2429,9 @@ static void BM_SM50_device_minimum_maximum_ssrgemm_tt_t_32x128x16_8x32x1_2x4_4x8 using WarpShape = cutlass::gemm::GemmShape<8, 32, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -2479,9 +2479,9 @@ static void 
BM_SM50_device_minimum_maximum_ssrgemm_tt_t_64x32x16_16x8x1_2x2_8x4_ using WarpShape = cutlass::gemm::GemmShape<16, 8, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -2529,9 +2529,9 @@ static void BM_SM50_device_minimum_maximum_ssrgemm_tt_t_64x64x8_16x16x1_4x2_4x8_ using WarpShape = cutlass::gemm::GemmShape<16, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -2579,9 +2579,9 @@ static void BM_SM50_device_minimum_maximum_ssrgemm_tt_t_64x128x8_16x32x1_4x4_4x8 using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -2629,9 +2629,9 @@ static void 
BM_SM50_device_minimum_maximum_ssrgemm_tt_t_64x256x8_16x64x1_4x8_4x8 using WarpShape = cutlass::gemm::GemmShape<16, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -2679,9 +2679,9 @@ static void BM_SM50_device_minimum_maximum_ssrgemm_tt_t_128x32x16_32x8x1_4x2_8x4 using WarpShape = cutlass::gemm::GemmShape<32, 8, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -2729,9 +2729,9 @@ static void BM_SM50_device_minimum_maximum_ssrgemm_tt_t_128x64x8_32x16x1_4x4_8x4 using WarpShape = cutlass::gemm::GemmShape<32, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -2779,9 +2779,9 @@ static void 
BM_SM50_device_minimum_maximum_ssrgemm_tt_t_128x128x8_32x32x1_8x4_4x using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -2829,9 +2829,9 @@ static void BM_SM50_device_minimum_maximum_ssrgemm_tt_t_256x64x8_64x16x1_8x4_8x4 using WarpShape = cutlass::gemm::GemmShape<64, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; diff --git a/bench/device/sm50_simt_minimum_multiplies_dsrgemm_nn_n.cu b/bench/device/sm50_simt_minimum_multiplies_dsrgemm_nn_n.cu index 625baad..b302685 100644 --- a/bench/device/sm50_simt_minimum_multiplies_dsrgemm_nn_n.cu +++ b/bench/device/sm50_simt_minimum_multiplies_dsrgemm_nn_n.cu @@ -29,9 +29,9 @@ static void BM_SM50_device_minimum_multiplies_dsrgemm_nn_n_8x32x8_8x32x1_2x4_4x8 using WarpShape = cutlass::gemm::GemmShape<8, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename 
cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -79,9 +79,9 @@ static void BM_SM50_device_minimum_multiplies_dsrgemm_nn_n_16x32x8_16x32x1_4x4_4 using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -129,9 +129,9 @@ static void BM_SM50_device_minimum_multiplies_dsrgemm_nn_n_16x64x8_16x64x1_4x8_4 using WarpShape = cutlass::gemm::GemmShape<16, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -179,9 +179,9 @@ static void BM_SM50_device_minimum_multiplies_dsrgemm_nn_n_32x32x8_32x32x1_8x4_4 using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename 
cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -229,9 +229,9 @@ static void BM_SM50_device_minimum_multiplies_dsrgemm_nn_n_8x32x8_8x16x1_2x2_4x8 using WarpShape = cutlass::gemm::GemmShape<8, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -279,9 +279,9 @@ static void BM_SM50_device_minimum_multiplies_dsrgemm_nn_n_8x64x8_8x32x1_2x4_4x8 using WarpShape = cutlass::gemm::GemmShape<8, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -329,9 +329,9 @@ static void BM_SM50_device_minimum_multiplies_dsrgemm_nn_n_16x32x8_16x16x1_4x2_4 using WarpShape = cutlass::gemm::GemmShape<16, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename 
cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -379,9 +379,9 @@ static void BM_SM50_device_minimum_multiplies_dsrgemm_nn_n_16x64x8_16x32x1_4x4_4 using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -429,9 +429,9 @@ static void BM_SM50_device_minimum_multiplies_dsrgemm_nn_n_16x128x8_16x64x1_4x8_ using WarpShape = cutlass::gemm::GemmShape<16, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -479,9 +479,9 @@ static void BM_SM50_device_minimum_multiplies_dsrgemm_nn_n_32x32x8_32x16x1_4x4_8 using WarpShape = cutlass::gemm::GemmShape<32, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename 
cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -529,9 +529,9 @@ static void BM_SM50_device_minimum_multiplies_dsrgemm_nn_n_32x64x8_32x32x1_8x4_4 using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -579,9 +579,9 @@ static void BM_SM50_device_minimum_multiplies_dsrgemm_nn_n_32x32x8_16x32x1_4x4_4 using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -629,9 +629,9 @@ static void BM_SM50_device_minimum_multiplies_dsrgemm_nn_n_64x32x8_32x32x1_8x4_4 using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename 
cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -679,9 +679,9 @@ static void BM_SM50_device_minimum_multiplies_dsrgemm_nn_n_16x32x8_8x16x1_2x2_4x using WarpShape = cutlass::gemm::GemmShape<8, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -729,9 +729,9 @@ static void BM_SM50_device_minimum_multiplies_dsrgemm_nn_n_16x64x8_8x32x1_2x4_4x using WarpShape = cutlass::gemm::GemmShape<8, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -779,9 +779,9 @@ static void BM_SM50_device_minimum_multiplies_dsrgemm_nn_n_32x32x8_16x16x1_4x2_4 using WarpShape = cutlass::gemm::GemmShape<16, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename 
cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -829,9 +829,9 @@ static void BM_SM50_device_minimum_multiplies_dsrgemm_nn_n_32x64x8_16x32x1_4x4_4 using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -879,9 +879,9 @@ static void BM_SM50_device_minimum_multiplies_dsrgemm_nn_n_32x128x8_16x64x1_4x8_ using WarpShape = cutlass::gemm::GemmShape<16, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -929,9 +929,9 @@ static void BM_SM50_device_minimum_multiplies_dsrgemm_nn_n_64x32x8_32x16x1_4x4_8 using WarpShape = cutlass::gemm::GemmShape<32, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename 
cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -979,9 +979,9 @@ static void BM_SM50_device_minimum_multiplies_dsrgemm_nn_n_64x64x8_32x32x1_8x4_4 using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1029,9 +1029,9 @@ static void BM_SM50_device_minimum_multiplies_dsrgemm_nn_n_128x32x8_64x16x1_8x4_ using WarpShape = cutlass::gemm::GemmShape<64, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1079,9 +1079,9 @@ static void BM_SM50_device_minimum_multiplies_dsrgemm_nn_n_16x64x16_8x16x1_2x2_4 using WarpShape = cutlass::gemm::GemmShape<8, 16, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename 
cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1129,9 +1129,9 @@ static void BM_SM50_device_minimum_multiplies_dsrgemm_nn_n_16x128x16_8x32x1_2x4_ using WarpShape = cutlass::gemm::GemmShape<8, 32, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1179,9 +1179,9 @@ static void BM_SM50_device_minimum_multiplies_dsrgemm_nn_n_32x32x8_16x8x1_2x2_8x using WarpShape = cutlass::gemm::GemmShape<16, 8, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1229,9 +1229,9 @@ static void BM_SM50_device_minimum_multiplies_dsrgemm_nn_n_32x64x8_16x16x1_4x2_4 using WarpShape = cutlass::gemm::GemmShape<16, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename 
cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1279,9 +1279,9 @@ static void BM_SM50_device_minimum_multiplies_dsrgemm_nn_n_32x128x8_16x32x1_4x4_ using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1329,9 +1329,9 @@ static void BM_SM50_device_minimum_multiplies_dsrgemm_nn_n_64x64x8_32x16x1_4x4_8 using WarpShape = cutlass::gemm::GemmShape<32, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1379,9 +1379,9 @@ static void BM_SM50_device_minimum_multiplies_dsrgemm_nn_n_32x32x8_8x16x1_2x2_4x using WarpShape = cutlass::gemm::GemmShape<8, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename 
cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1429,9 +1429,9 @@ static void BM_SM50_device_minimum_multiplies_dsrgemm_nn_n_64x32x8_16x16x1_4x2_4 using WarpShape = cutlass::gemm::GemmShape<16, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1479,9 +1479,9 @@ static void BM_SM50_device_minimum_multiplies_dsrgemm_nn_n_64x64x8_16x32x1_4x4_4 using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1529,9 +1529,9 @@ static void BM_SM50_device_minimum_multiplies_dsrgemm_nn_n_128x32x8_32x16x1_4x4_ using WarpShape = cutlass::gemm::GemmShape<32, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename 
cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1579,9 +1579,9 @@ static void BM_SM50_device_minimum_multiplies_dsrgemm_nn_n_32x64x16_8x16x1_2x2_4 using WarpShape = cutlass::gemm::GemmShape<8, 16, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1629,9 +1629,9 @@ static void BM_SM50_device_minimum_multiplies_dsrgemm_nn_n_32x128x16_8x32x1_2x4_ using WarpShape = cutlass::gemm::GemmShape<8, 32, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1679,9 +1679,9 @@ static void BM_SM50_device_minimum_multiplies_dsrgemm_nn_n_64x32x16_16x8x1_2x2_8 using WarpShape = cutlass::gemm::GemmShape<16, 8, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename 
cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1729,9 +1729,9 @@ static void BM_SM50_device_minimum_multiplies_dsrgemm_nn_n_64x64x8_16x16x1_4x2_4 using WarpShape = cutlass::gemm::GemmShape<16, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1779,9 +1779,9 @@ static void BM_SM50_device_minimum_multiplies_dsrgemm_nn_n_128x32x16_32x8x1_4x2_ using WarpShape = cutlass::gemm::GemmShape<32, 8, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; diff --git a/bench/device/sm50_simt_minimum_multiplies_dsrgemm_nn_t.cu b/bench/device/sm50_simt_minimum_multiplies_dsrgemm_nn_t.cu index 6f0dfef..3f14d37 100644 --- a/bench/device/sm50_simt_minimum_multiplies_dsrgemm_nn_t.cu +++ b/bench/device/sm50_simt_minimum_multiplies_dsrgemm_nn_t.cu @@ -29,9 +29,9 @@ static void BM_SM50_device_minimum_multiplies_dsrgemm_nn_t_8x32x8_8x32x1_2x4_4x8 using WarpShape = cutlass::gemm::GemmShape<8, 32, 8>; using 
InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -79,9 +79,9 @@ static void BM_SM50_device_minimum_multiplies_dsrgemm_nn_t_16x32x8_16x32x1_4x4_4 using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -129,9 +129,9 @@ static void BM_SM50_device_minimum_multiplies_dsrgemm_nn_t_16x64x8_16x64x1_4x8_4 using WarpShape = cutlass::gemm::GemmShape<16, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -179,9 +179,9 @@ static void BM_SM50_device_minimum_multiplies_dsrgemm_nn_t_32x32x8_32x32x1_8x4_4 using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = 
cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -229,9 +229,9 @@ static void BM_SM50_device_minimum_multiplies_dsrgemm_nn_t_8x32x8_8x16x1_2x2_4x8 using WarpShape = cutlass::gemm::GemmShape<8, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -279,9 +279,9 @@ static void BM_SM50_device_minimum_multiplies_dsrgemm_nn_t_8x64x8_8x32x1_2x4_4x8 using WarpShape = cutlass::gemm::GemmShape<8, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -329,9 +329,9 @@ static void BM_SM50_device_minimum_multiplies_dsrgemm_nn_t_16x32x8_16x16x1_4x2_4 using WarpShape = cutlass::gemm::GemmShape<16, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using 
Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -379,9 +379,9 @@ static void BM_SM50_device_minimum_multiplies_dsrgemm_nn_t_16x64x8_16x32x1_4x4_4 using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -429,9 +429,9 @@ static void BM_SM50_device_minimum_multiplies_dsrgemm_nn_t_16x128x8_16x64x1_4x8_ using WarpShape = cutlass::gemm::GemmShape<16, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -479,9 +479,9 @@ static void BM_SM50_device_minimum_multiplies_dsrgemm_nn_t_32x32x8_32x16x1_4x4_8 using WarpShape = cutlass::gemm::GemmShape<32, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename 
cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -529,9 +529,9 @@ static void BM_SM50_device_minimum_multiplies_dsrgemm_nn_t_32x64x8_32x32x1_8x4_4 using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -579,9 +579,9 @@ static void BM_SM50_device_minimum_multiplies_dsrgemm_nn_t_32x32x8_16x32x1_4x4_4 using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -629,9 +629,9 @@ static void BM_SM50_device_minimum_multiplies_dsrgemm_nn_t_64x32x8_32x32x1_8x4_4 using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename 
cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -679,9 +679,9 @@ static void BM_SM50_device_minimum_multiplies_dsrgemm_nn_t_16x32x8_8x16x1_2x2_4x using WarpShape = cutlass::gemm::GemmShape<8, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -729,9 +729,9 @@ static void BM_SM50_device_minimum_multiplies_dsrgemm_nn_t_16x64x8_8x32x1_2x4_4x using WarpShape = cutlass::gemm::GemmShape<8, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -779,9 +779,9 @@ static void BM_SM50_device_minimum_multiplies_dsrgemm_nn_t_32x32x8_16x16x1_4x2_4 using WarpShape = cutlass::gemm::GemmShape<16, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename 
cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -829,9 +829,9 @@ static void BM_SM50_device_minimum_multiplies_dsrgemm_nn_t_32x64x8_16x32x1_4x4_4 using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -879,9 +879,9 @@ static void BM_SM50_device_minimum_multiplies_dsrgemm_nn_t_32x128x8_16x64x1_4x8_ using WarpShape = cutlass::gemm::GemmShape<16, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -929,9 +929,9 @@ static void BM_SM50_device_minimum_multiplies_dsrgemm_nn_t_64x32x8_32x16x1_4x4_8 using WarpShape = cutlass::gemm::GemmShape<32, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename 
cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -979,9 +979,9 @@ static void BM_SM50_device_minimum_multiplies_dsrgemm_nn_t_64x64x8_32x32x1_8x4_4 using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1029,9 +1029,9 @@ static void BM_SM50_device_minimum_multiplies_dsrgemm_nn_t_128x32x8_64x16x1_8x4_ using WarpShape = cutlass::gemm::GemmShape<64, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1079,9 +1079,9 @@ static void BM_SM50_device_minimum_multiplies_dsrgemm_nn_t_16x64x16_8x16x1_2x2_4 using WarpShape = cutlass::gemm::GemmShape<8, 16, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename 
cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1129,9 +1129,9 @@ static void BM_SM50_device_minimum_multiplies_dsrgemm_nn_t_16x128x16_8x32x1_2x4_ using WarpShape = cutlass::gemm::GemmShape<8, 32, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1179,9 +1179,9 @@ static void BM_SM50_device_minimum_multiplies_dsrgemm_nn_t_32x32x8_16x8x1_2x2_8x using WarpShape = cutlass::gemm::GemmShape<16, 8, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1229,9 +1229,9 @@ static void BM_SM50_device_minimum_multiplies_dsrgemm_nn_t_32x64x8_16x16x1_4x2_4 using WarpShape = cutlass::gemm::GemmShape<16, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename 
cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1279,9 +1279,9 @@ static void BM_SM50_device_minimum_multiplies_dsrgemm_nn_t_32x128x8_16x32x1_4x4_ using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1329,9 +1329,9 @@ static void BM_SM50_device_minimum_multiplies_dsrgemm_nn_t_64x64x8_32x16x1_4x4_8 using WarpShape = cutlass::gemm::GemmShape<32, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1379,9 +1379,9 @@ static void BM_SM50_device_minimum_multiplies_dsrgemm_nn_t_32x32x8_8x16x1_2x2_4x using WarpShape = cutlass::gemm::GemmShape<8, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename 
cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1429,9 +1429,9 @@ static void BM_SM50_device_minimum_multiplies_dsrgemm_nn_t_64x32x8_16x16x1_4x2_4 using WarpShape = cutlass::gemm::GemmShape<16, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1479,9 +1479,9 @@ static void BM_SM50_device_minimum_multiplies_dsrgemm_nn_t_64x64x8_16x32x1_4x4_4 using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1529,9 +1529,9 @@ static void BM_SM50_device_minimum_multiplies_dsrgemm_nn_t_128x32x8_32x16x1_4x4_ using WarpShape = cutlass::gemm::GemmShape<32, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename 
cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1579,9 +1579,9 @@ static void BM_SM50_device_minimum_multiplies_dsrgemm_nn_t_32x64x16_8x16x1_2x2_4 using WarpShape = cutlass::gemm::GemmShape<8, 16, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1629,9 +1629,9 @@ static void BM_SM50_device_minimum_multiplies_dsrgemm_nn_t_32x128x16_8x32x1_2x4_ using WarpShape = cutlass::gemm::GemmShape<8, 32, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1679,9 +1679,9 @@ static void BM_SM50_device_minimum_multiplies_dsrgemm_nn_t_64x32x16_16x8x1_2x2_8 using WarpShape = cutlass::gemm::GemmShape<16, 8, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename 
cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1729,9 +1729,9 @@ static void BM_SM50_device_minimum_multiplies_dsrgemm_nn_t_64x64x8_16x16x1_4x2_4 using WarpShape = cutlass::gemm::GemmShape<16, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1779,9 +1779,9 @@ static void BM_SM50_device_minimum_multiplies_dsrgemm_nn_t_128x32x16_32x8x1_4x2_ using WarpShape = cutlass::gemm::GemmShape<32, 8, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; diff --git a/bench/device/sm50_simt_minimum_multiplies_dsrgemm_nt_n.cu b/bench/device/sm50_simt_minimum_multiplies_dsrgemm_nt_n.cu index 44cc104..1cf940a 100644 --- a/bench/device/sm50_simt_minimum_multiplies_dsrgemm_nt_n.cu +++ 
b/bench/device/sm50_simt_minimum_multiplies_dsrgemm_nt_n.cu @@ -29,9 +29,9 @@ static void BM_SM50_device_minimum_multiplies_dsrgemm_nt_n_8x32x8_8x32x1_2x4_4x8 using WarpShape = cutlass::gemm::GemmShape<8, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -79,9 +79,9 @@ static void BM_SM50_device_minimum_multiplies_dsrgemm_nt_n_16x32x8_16x32x1_4x4_4 using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -129,9 +129,9 @@ static void BM_SM50_device_minimum_multiplies_dsrgemm_nt_n_16x64x8_16x64x1_4x8_4 using WarpShape = cutlass::gemm::GemmShape<16, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = 
Config::MultiplicationOp; @@ -179,9 +179,9 @@ static void BM_SM50_device_minimum_multiplies_dsrgemm_nt_n_32x32x8_32x32x1_8x4_4 using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -229,9 +229,9 @@ static void BM_SM50_device_minimum_multiplies_dsrgemm_nt_n_8x32x8_8x16x1_2x2_4x8 using WarpShape = cutlass::gemm::GemmShape<8, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -279,9 +279,9 @@ static void BM_SM50_device_minimum_multiplies_dsrgemm_nt_n_8x64x8_8x32x1_2x4_4x8 using WarpShape = cutlass::gemm::GemmShape<8, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -329,9 +329,9 
@@ static void BM_SM50_device_minimum_multiplies_dsrgemm_nt_n_16x32x8_16x16x1_4x2_4 using WarpShape = cutlass::gemm::GemmShape<16, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -379,9 +379,9 @@ static void BM_SM50_device_minimum_multiplies_dsrgemm_nt_n_16x64x8_16x32x1_4x4_4 using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -429,9 +429,9 @@ static void BM_SM50_device_minimum_multiplies_dsrgemm_nt_n_16x128x8_16x64x1_4x8_ using WarpShape = cutlass::gemm::GemmShape<16, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -479,9 +479,9 @@ static void 
BM_SM50_device_minimum_multiplies_dsrgemm_nt_n_32x32x8_32x16x1_4x4_8 using WarpShape = cutlass::gemm::GemmShape<32, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -529,9 +529,9 @@ static void BM_SM50_device_minimum_multiplies_dsrgemm_nt_n_32x64x8_32x32x1_8x4_4 using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -579,9 +579,9 @@ static void BM_SM50_device_minimum_multiplies_dsrgemm_nt_n_32x32x8_16x32x1_4x4_4 using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -629,9 +629,9 @@ static void 
BM_SM50_device_minimum_multiplies_dsrgemm_nt_n_64x32x8_32x32x1_8x4_4 using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -679,9 +679,9 @@ static void BM_SM50_device_minimum_multiplies_dsrgemm_nt_n_16x32x8_8x16x1_2x2_4x using WarpShape = cutlass::gemm::GemmShape<8, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -729,9 +729,9 @@ static void BM_SM50_device_minimum_multiplies_dsrgemm_nt_n_16x64x8_8x32x1_2x4_4x using WarpShape = cutlass::gemm::GemmShape<8, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -779,9 +779,9 @@ static void 
BM_SM50_device_minimum_multiplies_dsrgemm_nt_n_32x32x8_16x16x1_4x2_4 using WarpShape = cutlass::gemm::GemmShape<16, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -829,9 +829,9 @@ static void BM_SM50_device_minimum_multiplies_dsrgemm_nt_n_32x64x8_16x32x1_4x4_4 using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -879,9 +879,9 @@ static void BM_SM50_device_minimum_multiplies_dsrgemm_nt_n_32x128x8_16x64x1_4x8_ using WarpShape = cutlass::gemm::GemmShape<16, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -929,9 +929,9 @@ static void 
BM_SM50_device_minimum_multiplies_dsrgemm_nt_n_64x32x8_32x16x1_4x4_8 using WarpShape = cutlass::gemm::GemmShape<32, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -979,9 +979,9 @@ static void BM_SM50_device_minimum_multiplies_dsrgemm_nt_n_64x64x8_32x32x1_8x4_4 using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1029,9 +1029,9 @@ static void BM_SM50_device_minimum_multiplies_dsrgemm_nt_n_128x32x8_64x16x1_8x4_ using WarpShape = cutlass::gemm::GemmShape<64, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1079,9 +1079,9 @@ static void 
BM_SM50_device_minimum_multiplies_dsrgemm_nt_n_16x64x16_8x16x1_2x2_4 using WarpShape = cutlass::gemm::GemmShape<8, 16, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1129,9 +1129,9 @@ static void BM_SM50_device_minimum_multiplies_dsrgemm_nt_n_16x128x16_8x32x1_2x4_ using WarpShape = cutlass::gemm::GemmShape<8, 32, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1179,9 +1179,9 @@ static void BM_SM50_device_minimum_multiplies_dsrgemm_nt_n_32x32x8_16x8x1_2x2_8x using WarpShape = cutlass::gemm::GemmShape<16, 8, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1229,9 +1229,9 @@ static void 
BM_SM50_device_minimum_multiplies_dsrgemm_nt_n_32x64x8_16x16x1_4x2_4 using WarpShape = cutlass::gemm::GemmShape<16, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1279,9 +1279,9 @@ static void BM_SM50_device_minimum_multiplies_dsrgemm_nt_n_32x128x8_16x32x1_4x4_ using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1329,9 +1329,9 @@ static void BM_SM50_device_minimum_multiplies_dsrgemm_nt_n_64x64x8_32x16x1_4x4_8 using WarpShape = cutlass::gemm::GemmShape<32, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1379,9 +1379,9 @@ static void 
BM_SM50_device_minimum_multiplies_dsrgemm_nt_n_32x32x8_8x16x1_2x2_4x using WarpShape = cutlass::gemm::GemmShape<8, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1429,9 +1429,9 @@ static void BM_SM50_device_minimum_multiplies_dsrgemm_nt_n_64x32x8_16x16x1_4x2_4 using WarpShape = cutlass::gemm::GemmShape<16, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1479,9 +1479,9 @@ static void BM_SM50_device_minimum_multiplies_dsrgemm_nt_n_64x64x8_16x32x1_4x4_4 using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1529,9 +1529,9 @@ static void 
BM_SM50_device_minimum_multiplies_dsrgemm_nt_n_128x32x8_32x16x1_4x4_ using WarpShape = cutlass::gemm::GemmShape<32, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1579,9 +1579,9 @@ static void BM_SM50_device_minimum_multiplies_dsrgemm_nt_n_32x64x16_8x16x1_2x2_4 using WarpShape = cutlass::gemm::GemmShape<8, 16, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1629,9 +1629,9 @@ static void BM_SM50_device_minimum_multiplies_dsrgemm_nt_n_32x128x16_8x32x1_2x4_ using WarpShape = cutlass::gemm::GemmShape<8, 32, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1679,9 +1679,9 @@ static void 
BM_SM50_device_minimum_multiplies_dsrgemm_nt_n_64x32x16_16x8x1_2x2_8 using WarpShape = cutlass::gemm::GemmShape<16, 8, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1729,9 +1729,9 @@ static void BM_SM50_device_minimum_multiplies_dsrgemm_nt_n_64x64x8_16x16x1_4x2_4 using WarpShape = cutlass::gemm::GemmShape<16, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1779,9 +1779,9 @@ static void BM_SM50_device_minimum_multiplies_dsrgemm_nt_n_128x32x16_32x8x1_4x2_ using WarpShape = cutlass::gemm::GemmShape<32, 8, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; diff --git 
a/bench/device/sm50_simt_minimum_multiplies_dsrgemm_nt_t.cu b/bench/device/sm50_simt_minimum_multiplies_dsrgemm_nt_t.cu index a0adc1d..9e522e1 100644 --- a/bench/device/sm50_simt_minimum_multiplies_dsrgemm_nt_t.cu +++ b/bench/device/sm50_simt_minimum_multiplies_dsrgemm_nt_t.cu @@ -29,9 +29,9 @@ static void BM_SM50_device_minimum_multiplies_dsrgemm_nt_t_8x32x8_8x32x1_2x4_4x8 using WarpShape = cutlass::gemm::GemmShape<8, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -79,9 +79,9 @@ static void BM_SM50_device_minimum_multiplies_dsrgemm_nt_t_16x32x8_16x32x1_4x4_4 using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -129,9 +129,9 @@ static void BM_SM50_device_minimum_multiplies_dsrgemm_nt_t_16x64x8_16x64x1_4x8_4 using WarpShape = cutlass::gemm::GemmShape<16, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = 
typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -179,9 +179,9 @@ static void BM_SM50_device_minimum_multiplies_dsrgemm_nt_t_32x32x8_32x32x1_8x4_4 using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -229,9 +229,9 @@ static void BM_SM50_device_minimum_multiplies_dsrgemm_nt_t_8x32x8_8x16x1_2x2_4x8 using WarpShape = cutlass::gemm::GemmShape<8, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -279,9 +279,9 @@ static void BM_SM50_device_minimum_multiplies_dsrgemm_nt_t_8x64x8_8x32x1_2x4_4x8 using WarpShape = cutlass::gemm::GemmShape<8, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename 
cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -329,9 +329,9 @@ static void BM_SM50_device_minimum_multiplies_dsrgemm_nt_t_16x32x8_16x16x1_4x2_4 using WarpShape = cutlass::gemm::GemmShape<16, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -379,9 +379,9 @@ static void BM_SM50_device_minimum_multiplies_dsrgemm_nt_t_16x64x8_16x32x1_4x4_4 using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -429,9 +429,9 @@ static void BM_SM50_device_minimum_multiplies_dsrgemm_nt_t_16x128x8_16x64x1_4x8_ using WarpShape = cutlass::gemm::GemmShape<16, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename 
cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -479,9 +479,9 @@ static void BM_SM50_device_minimum_multiplies_dsrgemm_nt_t_32x32x8_32x16x1_4x4_8 using WarpShape = cutlass::gemm::GemmShape<32, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -529,9 +529,9 @@ static void BM_SM50_device_minimum_multiplies_dsrgemm_nt_t_32x64x8_32x32x1_8x4_4 using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -579,9 +579,9 @@ static void BM_SM50_device_minimum_multiplies_dsrgemm_nt_t_32x32x8_16x32x1_4x4_4 using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename 
cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -629,9 +629,9 @@ static void BM_SM50_device_minimum_multiplies_dsrgemm_nt_t_64x32x8_32x32x1_8x4_4 using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -679,9 +679,9 @@ static void BM_SM50_device_minimum_multiplies_dsrgemm_nt_t_16x32x8_8x16x1_2x2_4x using WarpShape = cutlass::gemm::GemmShape<8, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -729,9 +729,9 @@ static void BM_SM50_device_minimum_multiplies_dsrgemm_nt_t_16x64x8_8x32x1_2x4_4x using WarpShape = cutlass::gemm::GemmShape<8, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename 
cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -779,9 +779,9 @@ static void BM_SM50_device_minimum_multiplies_dsrgemm_nt_t_32x32x8_16x16x1_4x2_4 using WarpShape = cutlass::gemm::GemmShape<16, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -829,9 +829,9 @@ static void BM_SM50_device_minimum_multiplies_dsrgemm_nt_t_32x64x8_16x32x1_4x4_4 using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -879,9 +879,9 @@ static void BM_SM50_device_minimum_multiplies_dsrgemm_nt_t_32x128x8_16x64x1_4x8_ using WarpShape = cutlass::gemm::GemmShape<16, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename 
cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -929,9 +929,9 @@ static void BM_SM50_device_minimum_multiplies_dsrgemm_nt_t_64x32x8_32x16x1_4x4_8 using WarpShape = cutlass::gemm::GemmShape<32, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -979,9 +979,9 @@ static void BM_SM50_device_minimum_multiplies_dsrgemm_nt_t_64x64x8_32x32x1_8x4_4 using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1029,9 +1029,9 @@ static void BM_SM50_device_minimum_multiplies_dsrgemm_nt_t_128x32x8_64x16x1_8x4_ using WarpShape = cutlass::gemm::GemmShape<64, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename 
cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1079,9 +1079,9 @@ static void BM_SM50_device_minimum_multiplies_dsrgemm_nt_t_16x64x16_8x16x1_2x2_4 using WarpShape = cutlass::gemm::GemmShape<8, 16, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1129,9 +1129,9 @@ static void BM_SM50_device_minimum_multiplies_dsrgemm_nt_t_16x128x16_8x32x1_2x4_ using WarpShape = cutlass::gemm::GemmShape<8, 32, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1179,9 +1179,9 @@ static void BM_SM50_device_minimum_multiplies_dsrgemm_nt_t_32x32x8_16x8x1_2x2_8x using WarpShape = cutlass::gemm::GemmShape<16, 8, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename 
cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1229,9 +1229,9 @@ static void BM_SM50_device_minimum_multiplies_dsrgemm_nt_t_32x64x8_16x16x1_4x2_4 using WarpShape = cutlass::gemm::GemmShape<16, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1279,9 +1279,9 @@ static void BM_SM50_device_minimum_multiplies_dsrgemm_nt_t_32x128x8_16x32x1_4x4_ using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1329,9 +1329,9 @@ static void BM_SM50_device_minimum_multiplies_dsrgemm_nt_t_64x64x8_32x16x1_4x4_8 using WarpShape = cutlass::gemm::GemmShape<32, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename 
cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1379,9 +1379,9 @@ static void BM_SM50_device_minimum_multiplies_dsrgemm_nt_t_32x32x8_8x16x1_2x2_4x using WarpShape = cutlass::gemm::GemmShape<8, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1429,9 +1429,9 @@ static void BM_SM50_device_minimum_multiplies_dsrgemm_nt_t_64x32x8_16x16x1_4x2_4 using WarpShape = cutlass::gemm::GemmShape<16, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1479,9 +1479,9 @@ static void BM_SM50_device_minimum_multiplies_dsrgemm_nt_t_64x64x8_16x32x1_4x4_4 using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename 
cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1529,9 +1529,9 @@ static void BM_SM50_device_minimum_multiplies_dsrgemm_nt_t_128x32x8_32x16x1_4x4_ using WarpShape = cutlass::gemm::GemmShape<32, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1579,9 +1579,9 @@ static void BM_SM50_device_minimum_multiplies_dsrgemm_nt_t_32x64x16_8x16x1_2x2_4 using WarpShape = cutlass::gemm::GemmShape<8, 16, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1629,9 +1629,9 @@ static void BM_SM50_device_minimum_multiplies_dsrgemm_nt_t_32x128x16_8x32x1_2x4_ using WarpShape = cutlass::gemm::GemmShape<8, 32, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename 
cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1679,9 +1679,9 @@ static void BM_SM50_device_minimum_multiplies_dsrgemm_nt_t_64x32x16_16x8x1_2x2_8 using WarpShape = cutlass::gemm::GemmShape<16, 8, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1729,9 +1729,9 @@ static void BM_SM50_device_minimum_multiplies_dsrgemm_nt_t_64x64x8_16x16x1_4x2_4 using WarpShape = cutlass::gemm::GemmShape<16, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1779,9 +1779,9 @@ static void BM_SM50_device_minimum_multiplies_dsrgemm_nt_t_128x32x16_32x8x1_4x2_ using WarpShape = cutlass::gemm::GemmShape<32, 8, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename 
cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; diff --git a/bench/device/sm50_simt_minimum_multiplies_dsrgemm_tn_n.cu b/bench/device/sm50_simt_minimum_multiplies_dsrgemm_tn_n.cu index 13a2903..6dfc892 100644 --- a/bench/device/sm50_simt_minimum_multiplies_dsrgemm_tn_n.cu +++ b/bench/device/sm50_simt_minimum_multiplies_dsrgemm_tn_n.cu @@ -29,9 +29,9 @@ static void BM_SM50_device_minimum_multiplies_dsrgemm_tn_n_8x32x8_8x32x1_2x4_4x8 using WarpShape = cutlass::gemm::GemmShape<8, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -79,9 +79,9 @@ static void BM_SM50_device_minimum_multiplies_dsrgemm_tn_n_16x32x8_16x32x1_4x4_4 using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -129,9 +129,9 @@ static void BM_SM50_device_minimum_multiplies_dsrgemm_tn_n_16x64x8_16x64x1_4x8_4 using WarpShape = cutlass::gemm::GemmShape<16, 64, 8>; using InstructionShape = 
cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -179,9 +179,9 @@ static void BM_SM50_device_minimum_multiplies_dsrgemm_tn_n_32x32x8_32x32x1_8x4_4 using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -229,9 +229,9 @@ static void BM_SM50_device_minimum_multiplies_dsrgemm_tn_n_8x32x8_8x16x1_2x2_4x8 using WarpShape = cutlass::gemm::GemmShape<8, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -279,9 +279,9 @@ static void BM_SM50_device_minimum_multiplies_dsrgemm_tn_n_8x64x8_8x32x1_2x4_4x8 using WarpShape = cutlass::gemm::GemmShape<8, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using 
Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -329,9 +329,9 @@ static void BM_SM50_device_minimum_multiplies_dsrgemm_tn_n_16x32x8_16x16x1_4x2_4 using WarpShape = cutlass::gemm::GemmShape<16, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -379,9 +379,9 @@ static void BM_SM50_device_minimum_multiplies_dsrgemm_tn_n_16x64x8_16x32x1_4x4_4 using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -429,9 +429,9 @@ static void BM_SM50_device_minimum_multiplies_dsrgemm_tn_n_16x128x8_16x64x1_4x8_ using WarpShape = cutlass::gemm::GemmShape<16, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename 
cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -479,9 +479,9 @@ static void BM_SM50_device_minimum_multiplies_dsrgemm_tn_n_32x32x8_32x16x1_4x4_8 using WarpShape = cutlass::gemm::GemmShape<32, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -529,9 +529,9 @@ static void BM_SM50_device_minimum_multiplies_dsrgemm_tn_n_32x64x8_32x32x1_8x4_4 using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -579,9 +579,9 @@ static void BM_SM50_device_minimum_multiplies_dsrgemm_tn_n_32x32x8_16x32x1_4x4_4 using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename 
cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -629,9 +629,9 @@ static void BM_SM50_device_minimum_multiplies_dsrgemm_tn_n_64x32x8_32x32x1_8x4_4 using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -679,9 +679,9 @@ static void BM_SM50_device_minimum_multiplies_dsrgemm_tn_n_16x32x8_8x16x1_2x2_4x using WarpShape = cutlass::gemm::GemmShape<8, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -729,9 +729,9 @@ static void BM_SM50_device_minimum_multiplies_dsrgemm_tn_n_16x64x8_8x32x1_2x4_4x using WarpShape = cutlass::gemm::GemmShape<8, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename 
cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -779,9 +779,9 @@ static void BM_SM50_device_minimum_multiplies_dsrgemm_tn_n_32x32x8_16x16x1_4x2_4 using WarpShape = cutlass::gemm::GemmShape<16, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -829,9 +829,9 @@ static void BM_SM50_device_minimum_multiplies_dsrgemm_tn_n_32x64x8_16x32x1_4x4_4 using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -879,9 +879,9 @@ static void BM_SM50_device_minimum_multiplies_dsrgemm_tn_n_32x128x8_16x64x1_4x8_ using WarpShape = cutlass::gemm::GemmShape<16, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename 
cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -929,9 +929,9 @@ static void BM_SM50_device_minimum_multiplies_dsrgemm_tn_n_64x32x8_32x16x1_4x4_8 using WarpShape = cutlass::gemm::GemmShape<32, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -979,9 +979,9 @@ static void BM_SM50_device_minimum_multiplies_dsrgemm_tn_n_64x64x8_32x32x1_8x4_4 using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1029,9 +1029,9 @@ static void BM_SM50_device_minimum_multiplies_dsrgemm_tn_n_128x32x8_64x16x1_8x4_ using WarpShape = cutlass::gemm::GemmShape<64, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename 
cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1079,9 +1079,9 @@ static void BM_SM50_device_minimum_multiplies_dsrgemm_tn_n_16x64x16_8x16x1_2x2_4 using WarpShape = cutlass::gemm::GemmShape<8, 16, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1129,9 +1129,9 @@ static void BM_SM50_device_minimum_multiplies_dsrgemm_tn_n_16x128x16_8x32x1_2x4_ using WarpShape = cutlass::gemm::GemmShape<8, 32, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1179,9 +1179,9 @@ static void BM_SM50_device_minimum_multiplies_dsrgemm_tn_n_32x32x8_16x8x1_2x2_8x using WarpShape = cutlass::gemm::GemmShape<16, 8, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename 
cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1229,9 +1229,9 @@ static void BM_SM50_device_minimum_multiplies_dsrgemm_tn_n_32x64x8_16x16x1_4x2_4 using WarpShape = cutlass::gemm::GemmShape<16, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1279,9 +1279,9 @@ static void BM_SM50_device_minimum_multiplies_dsrgemm_tn_n_32x128x8_16x32x1_4x4_ using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1329,9 +1329,9 @@ static void BM_SM50_device_minimum_multiplies_dsrgemm_tn_n_64x64x8_32x16x1_4x4_8 using WarpShape = cutlass::gemm::GemmShape<32, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename 
cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1379,9 +1379,9 @@ static void BM_SM50_device_minimum_multiplies_dsrgemm_tn_n_32x32x8_8x16x1_2x2_4x using WarpShape = cutlass::gemm::GemmShape<8, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1429,9 +1429,9 @@ static void BM_SM50_device_minimum_multiplies_dsrgemm_tn_n_64x32x8_16x16x1_4x2_4 using WarpShape = cutlass::gemm::GemmShape<16, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1479,9 +1479,9 @@ static void BM_SM50_device_minimum_multiplies_dsrgemm_tn_n_64x64x8_16x32x1_4x4_4 using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename 
cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1529,9 +1529,9 @@ static void BM_SM50_device_minimum_multiplies_dsrgemm_tn_n_128x32x8_32x16x1_4x4_ using WarpShape = cutlass::gemm::GemmShape<32, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1579,9 +1579,9 @@ static void BM_SM50_device_minimum_multiplies_dsrgemm_tn_n_32x64x16_8x16x1_2x2_4 using WarpShape = cutlass::gemm::GemmShape<8, 16, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1629,9 +1629,9 @@ static void BM_SM50_device_minimum_multiplies_dsrgemm_tn_n_32x128x16_8x32x1_2x4_ using WarpShape = cutlass::gemm::GemmShape<8, 32, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename 
cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1679,9 +1679,9 @@ static void BM_SM50_device_minimum_multiplies_dsrgemm_tn_n_64x32x16_16x8x1_2x2_8 using WarpShape = cutlass::gemm::GemmShape<16, 8, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1729,9 +1729,9 @@ static void BM_SM50_device_minimum_multiplies_dsrgemm_tn_n_64x64x8_16x16x1_4x2_4 using WarpShape = cutlass::gemm::GemmShape<16, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1779,9 +1779,9 @@ static void BM_SM50_device_minimum_multiplies_dsrgemm_tn_n_128x32x16_32x8x1_4x2_ using WarpShape = cutlass::gemm::GemmShape<32, 8, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename 
cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; diff --git a/bench/device/sm50_simt_minimum_multiplies_dsrgemm_tn_t.cu b/bench/device/sm50_simt_minimum_multiplies_dsrgemm_tn_t.cu index c5ca3c9..db47670 100644 --- a/bench/device/sm50_simt_minimum_multiplies_dsrgemm_tn_t.cu +++ b/bench/device/sm50_simt_minimum_multiplies_dsrgemm_tn_t.cu @@ -29,9 +29,9 @@ static void BM_SM50_device_minimum_multiplies_dsrgemm_tn_t_8x32x8_8x32x1_2x4_4x8 using WarpShape = cutlass::gemm::GemmShape<8, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -79,9 +79,9 @@ static void BM_SM50_device_minimum_multiplies_dsrgemm_tn_t_16x32x8_16x32x1_4x4_4 using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = 
Config::MultiplicationOp; @@ -129,9 +129,9 @@ static void BM_SM50_device_minimum_multiplies_dsrgemm_tn_t_16x64x8_16x64x1_4x8_4 using WarpShape = cutlass::gemm::GemmShape<16, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -179,9 +179,9 @@ static void BM_SM50_device_minimum_multiplies_dsrgemm_tn_t_32x32x8_32x32x1_8x4_4 using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -229,9 +229,9 @@ static void BM_SM50_device_minimum_multiplies_dsrgemm_tn_t_8x32x8_8x16x1_2x2_4x8 using WarpShape = cutlass::gemm::GemmShape<8, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -279,9 
+279,9 @@ static void BM_SM50_device_minimum_multiplies_dsrgemm_tn_t_8x64x8_8x32x1_2x4_4x8 using WarpShape = cutlass::gemm::GemmShape<8, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -329,9 +329,9 @@ static void BM_SM50_device_minimum_multiplies_dsrgemm_tn_t_16x32x8_16x16x1_4x2_4 using WarpShape = cutlass::gemm::GemmShape<16, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -379,9 +379,9 @@ static void BM_SM50_device_minimum_multiplies_dsrgemm_tn_t_16x64x8_16x32x1_4x4_4 using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -429,9 +429,9 @@ static void 
BM_SM50_device_minimum_multiplies_dsrgemm_tn_t_16x128x8_16x64x1_4x8_ using WarpShape = cutlass::gemm::GemmShape<16, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -479,9 +479,9 @@ static void BM_SM50_device_minimum_multiplies_dsrgemm_tn_t_32x32x8_32x16x1_4x4_8 using WarpShape = cutlass::gemm::GemmShape<32, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -529,9 +529,9 @@ static void BM_SM50_device_minimum_multiplies_dsrgemm_tn_t_32x64x8_32x32x1_8x4_4 using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -579,9 +579,9 @@ static void 
BM_SM50_device_minimum_multiplies_dsrgemm_tn_t_32x32x8_16x32x1_4x4_4 using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -629,9 +629,9 @@ static void BM_SM50_device_minimum_multiplies_dsrgemm_tn_t_64x32x8_32x32x1_8x4_4 using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -679,9 +679,9 @@ static void BM_SM50_device_minimum_multiplies_dsrgemm_tn_t_16x32x8_8x16x1_2x2_4x using WarpShape = cutlass::gemm::GemmShape<8, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -729,9 +729,9 @@ static void 
BM_SM50_device_minimum_multiplies_dsrgemm_tn_t_16x64x8_8x32x1_2x4_4x using WarpShape = cutlass::gemm::GemmShape<8, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -779,9 +779,9 @@ static void BM_SM50_device_minimum_multiplies_dsrgemm_tn_t_32x32x8_16x16x1_4x2_4 using WarpShape = cutlass::gemm::GemmShape<16, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -829,9 +829,9 @@ static void BM_SM50_device_minimum_multiplies_dsrgemm_tn_t_32x64x8_16x32x1_4x4_4 using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -879,9 +879,9 @@ static void 
BM_SM50_device_minimum_multiplies_dsrgemm_tn_t_32x128x8_16x64x1_4x8_ using WarpShape = cutlass::gemm::GemmShape<16, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -929,9 +929,9 @@ static void BM_SM50_device_minimum_multiplies_dsrgemm_tn_t_64x32x8_32x16x1_4x4_8 using WarpShape = cutlass::gemm::GemmShape<32, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -979,9 +979,9 @@ static void BM_SM50_device_minimum_multiplies_dsrgemm_tn_t_64x64x8_32x32x1_8x4_4 using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1029,9 +1029,9 @@ static void 
BM_SM50_device_minimum_multiplies_dsrgemm_tn_t_128x32x8_64x16x1_8x4_ using WarpShape = cutlass::gemm::GemmShape<64, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1079,9 +1079,9 @@ static void BM_SM50_device_minimum_multiplies_dsrgemm_tn_t_16x64x16_8x16x1_2x2_4 using WarpShape = cutlass::gemm::GemmShape<8, 16, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1129,9 +1129,9 @@ static void BM_SM50_device_minimum_multiplies_dsrgemm_tn_t_16x128x16_8x32x1_2x4_ using WarpShape = cutlass::gemm::GemmShape<8, 32, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1179,9 +1179,9 @@ static void 
BM_SM50_device_minimum_multiplies_dsrgemm_tn_t_32x32x8_16x8x1_2x2_8x using WarpShape = cutlass::gemm::GemmShape<16, 8, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1229,9 +1229,9 @@ static void BM_SM50_device_minimum_multiplies_dsrgemm_tn_t_32x64x8_16x16x1_4x2_4 using WarpShape = cutlass::gemm::GemmShape<16, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1279,9 +1279,9 @@ static void BM_SM50_device_minimum_multiplies_dsrgemm_tn_t_32x128x8_16x32x1_4x4_ using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1329,9 +1329,9 @@ static void 
BM_SM50_device_minimum_multiplies_dsrgemm_tn_t_64x64x8_32x16x1_4x4_8 using WarpShape = cutlass::gemm::GemmShape<32, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1379,9 +1379,9 @@ static void BM_SM50_device_minimum_multiplies_dsrgemm_tn_t_32x32x8_8x16x1_2x2_4x using WarpShape = cutlass::gemm::GemmShape<8, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1429,9 +1429,9 @@ static void BM_SM50_device_minimum_multiplies_dsrgemm_tn_t_64x32x8_16x16x1_4x2_4 using WarpShape = cutlass::gemm::GemmShape<16, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1479,9 +1479,9 @@ static void 
BM_SM50_device_minimum_multiplies_dsrgemm_tn_t_64x64x8_16x32x1_4x4_4 using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1529,9 +1529,9 @@ static void BM_SM50_device_minimum_multiplies_dsrgemm_tn_t_128x32x8_32x16x1_4x4_ using WarpShape = cutlass::gemm::GemmShape<32, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1579,9 +1579,9 @@ static void BM_SM50_device_minimum_multiplies_dsrgemm_tn_t_32x64x16_8x16x1_2x2_4 using WarpShape = cutlass::gemm::GemmShape<8, 16, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1629,9 +1629,9 @@ static void 
BM_SM50_device_minimum_multiplies_dsrgemm_tn_t_32x128x16_8x32x1_2x4_ using WarpShape = cutlass::gemm::GemmShape<8, 32, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1679,9 +1679,9 @@ static void BM_SM50_device_minimum_multiplies_dsrgemm_tn_t_64x32x16_16x8x1_2x2_8 using WarpShape = cutlass::gemm::GemmShape<16, 8, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1729,9 +1729,9 @@ static void BM_SM50_device_minimum_multiplies_dsrgemm_tn_t_64x64x8_16x16x1_4x2_4 using WarpShape = cutlass::gemm::GemmShape<16, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1779,9 +1779,9 @@ static void 
BM_SM50_device_minimum_multiplies_dsrgemm_tn_t_128x32x16_32x8x1_4x2_ using WarpShape = cutlass::gemm::GemmShape<32, 8, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; diff --git a/bench/device/sm50_simt_minimum_multiplies_dsrgemm_tt_n.cu b/bench/device/sm50_simt_minimum_multiplies_dsrgemm_tt_n.cu index c5b8c24..541e51b 100644 --- a/bench/device/sm50_simt_minimum_multiplies_dsrgemm_tt_n.cu +++ b/bench/device/sm50_simt_minimum_multiplies_dsrgemm_tt_n.cu @@ -29,9 +29,9 @@ static void BM_SM50_device_minimum_multiplies_dsrgemm_tt_n_8x32x8_8x32x1_2x4_4x8 using WarpShape = cutlass::gemm::GemmShape<8, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -79,9 +79,9 @@ static void BM_SM50_device_minimum_multiplies_dsrgemm_tt_n_16x32x8_16x32x1_4x4_4 using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename 
cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -129,9 +129,9 @@ static void BM_SM50_device_minimum_multiplies_dsrgemm_tt_n_16x64x8_16x64x1_4x8_4 using WarpShape = cutlass::gemm::GemmShape<16, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -179,9 +179,9 @@ static void BM_SM50_device_minimum_multiplies_dsrgemm_tt_n_32x32x8_32x32x1_8x4_4 using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -229,9 +229,9 @@ static void BM_SM50_device_minimum_multiplies_dsrgemm_tt_n_8x32x8_8x16x1_2x2_4x8 using WarpShape = cutlass::gemm::GemmShape<8, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename 
cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -279,9 +279,9 @@ static void BM_SM50_device_minimum_multiplies_dsrgemm_tt_n_8x64x8_8x32x1_2x4_4x8 using WarpShape = cutlass::gemm::GemmShape<8, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -329,9 +329,9 @@ static void BM_SM50_device_minimum_multiplies_dsrgemm_tt_n_16x32x8_16x16x1_4x2_4 using WarpShape = cutlass::gemm::GemmShape<16, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -379,9 +379,9 @@ static void BM_SM50_device_minimum_multiplies_dsrgemm_tt_n_16x64x8_16x32x1_4x4_4 using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename 
cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -429,9 +429,9 @@ static void BM_SM50_device_minimum_multiplies_dsrgemm_tt_n_16x128x8_16x64x1_4x8_ using WarpShape = cutlass::gemm::GemmShape<16, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -479,9 +479,9 @@ static void BM_SM50_device_minimum_multiplies_dsrgemm_tt_n_32x32x8_32x16x1_4x4_8 using WarpShape = cutlass::gemm::GemmShape<32, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -529,9 +529,9 @@ static void BM_SM50_device_minimum_multiplies_dsrgemm_tt_n_32x64x8_32x32x1_8x4_4 using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename 
cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -579,9 +579,9 @@ static void BM_SM50_device_minimum_multiplies_dsrgemm_tt_n_32x32x8_16x32x1_4x4_4 using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -629,9 +629,9 @@ static void BM_SM50_device_minimum_multiplies_dsrgemm_tt_n_64x32x8_32x32x1_8x4_4 using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -679,9 +679,9 @@ static void BM_SM50_device_minimum_multiplies_dsrgemm_tt_n_16x32x8_8x16x1_2x2_4x using WarpShape = cutlass::gemm::GemmShape<8, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename 
cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -729,9 +729,9 @@ static void BM_SM50_device_minimum_multiplies_dsrgemm_tt_n_16x64x8_8x32x1_2x4_4x using WarpShape = cutlass::gemm::GemmShape<8, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -779,9 +779,9 @@ static void BM_SM50_device_minimum_multiplies_dsrgemm_tt_n_32x32x8_16x16x1_4x2_4 using WarpShape = cutlass::gemm::GemmShape<16, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -829,9 +829,9 @@ static void BM_SM50_device_minimum_multiplies_dsrgemm_tt_n_32x64x8_16x32x1_4x4_4 using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename 
cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -879,9 +879,9 @@ static void BM_SM50_device_minimum_multiplies_dsrgemm_tt_n_32x128x8_16x64x1_4x8_ using WarpShape = cutlass::gemm::GemmShape<16, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -929,9 +929,9 @@ static void BM_SM50_device_minimum_multiplies_dsrgemm_tt_n_64x32x8_32x16x1_4x4_8 using WarpShape = cutlass::gemm::GemmShape<32, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -979,9 +979,9 @@ static void BM_SM50_device_minimum_multiplies_dsrgemm_tt_n_64x64x8_32x32x1_8x4_4 using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename 
cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1029,9 +1029,9 @@ static void BM_SM50_device_minimum_multiplies_dsrgemm_tt_n_128x32x8_64x16x1_8x4_ using WarpShape = cutlass::gemm::GemmShape<64, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1079,9 +1079,9 @@ static void BM_SM50_device_minimum_multiplies_dsrgemm_tt_n_16x64x16_8x16x1_2x2_4 using WarpShape = cutlass::gemm::GemmShape<8, 16, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1129,9 +1129,9 @@ static void BM_SM50_device_minimum_multiplies_dsrgemm_tt_n_16x128x16_8x32x1_2x4_ using WarpShape = cutlass::gemm::GemmShape<8, 32, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename 
cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1179,9 +1179,9 @@ static void BM_SM50_device_minimum_multiplies_dsrgemm_tt_n_32x32x8_16x8x1_2x2_8x using WarpShape = cutlass::gemm::GemmShape<16, 8, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1229,9 +1229,9 @@ static void BM_SM50_device_minimum_multiplies_dsrgemm_tt_n_32x64x8_16x16x1_4x2_4 using WarpShape = cutlass::gemm::GemmShape<16, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1279,9 +1279,9 @@ static void BM_SM50_device_minimum_multiplies_dsrgemm_tt_n_32x128x8_16x32x1_4x4_ using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename 
cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1329,9 +1329,9 @@ static void BM_SM50_device_minimum_multiplies_dsrgemm_tt_n_64x64x8_32x16x1_4x4_8 using WarpShape = cutlass::gemm::GemmShape<32, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1379,9 +1379,9 @@ static void BM_SM50_device_minimum_multiplies_dsrgemm_tt_n_32x32x8_8x16x1_2x2_4x using WarpShape = cutlass::gemm::GemmShape<8, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1429,9 +1429,9 @@ static void BM_SM50_device_minimum_multiplies_dsrgemm_tt_n_64x32x8_16x16x1_4x2_4 using WarpShape = cutlass::gemm::GemmShape<16, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename 
cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1479,9 +1479,9 @@ static void BM_SM50_device_minimum_multiplies_dsrgemm_tt_n_64x64x8_16x32x1_4x4_4 using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1529,9 +1529,9 @@ static void BM_SM50_device_minimum_multiplies_dsrgemm_tt_n_128x32x8_32x16x1_4x4_ using WarpShape = cutlass::gemm::GemmShape<32, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1579,9 +1579,9 @@ static void BM_SM50_device_minimum_multiplies_dsrgemm_tt_n_32x64x16_8x16x1_2x2_4 using WarpShape = cutlass::gemm::GemmShape<8, 16, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename 
cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1629,9 +1629,9 @@ static void BM_SM50_device_minimum_multiplies_dsrgemm_tt_n_32x128x16_8x32x1_2x4_ using WarpShape = cutlass::gemm::GemmShape<8, 32, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1679,9 +1679,9 @@ static void BM_SM50_device_minimum_multiplies_dsrgemm_tt_n_64x32x16_16x8x1_2x2_8 using WarpShape = cutlass::gemm::GemmShape<16, 8, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1729,9 +1729,9 @@ static void BM_SM50_device_minimum_multiplies_dsrgemm_tt_n_64x64x8_16x16x1_4x2_4 using WarpShape = cutlass::gemm::GemmShape<16, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename 
cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1779,9 +1779,9 @@ static void BM_SM50_device_minimum_multiplies_dsrgemm_tt_n_128x32x16_32x8x1_4x2_ using WarpShape = cutlass::gemm::GemmShape<32, 8, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; diff --git a/bench/device/sm50_simt_minimum_multiplies_dsrgemm_tt_t.cu b/bench/device/sm50_simt_minimum_multiplies_dsrgemm_tt_t.cu index 5445238..3064a03 100644 --- a/bench/device/sm50_simt_minimum_multiplies_dsrgemm_tt_t.cu +++ b/bench/device/sm50_simt_minimum_multiplies_dsrgemm_tt_t.cu @@ -29,9 +29,9 @@ static void BM_SM50_device_minimum_multiplies_dsrgemm_tt_t_8x32x8_8x32x1_2x4_4x8 using WarpShape = cutlass::gemm::GemmShape<8, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -79,9 +79,9 @@ static void BM_SM50_device_minimum_multiplies_dsrgemm_tt_t_16x32x8_16x32x1_4x4_4 using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = 
cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -129,9 +129,9 @@ static void BM_SM50_device_minimum_multiplies_dsrgemm_tt_t_16x64x8_16x64x1_4x8_4 using WarpShape = cutlass::gemm::GemmShape<16, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -179,9 +179,9 @@ static void BM_SM50_device_minimum_multiplies_dsrgemm_tt_t_32x32x8_32x32x1_8x4_4 using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -229,9 +229,9 @@ static void BM_SM50_device_minimum_multiplies_dsrgemm_tt_t_8x32x8_8x16x1_2x2_4x8 using WarpShape = cutlass::gemm::GemmShape<8, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - 
using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -279,9 +279,9 @@ static void BM_SM50_device_minimum_multiplies_dsrgemm_tt_t_8x64x8_8x32x1_2x4_4x8 using WarpShape = cutlass::gemm::GemmShape<8, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -329,9 +329,9 @@ static void BM_SM50_device_minimum_multiplies_dsrgemm_tt_t_16x32x8_16x16x1_4x2_4 using WarpShape = cutlass::gemm::GemmShape<16, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -379,9 +379,9 @@ static void BM_SM50_device_minimum_multiplies_dsrgemm_tt_t_16x64x8_16x32x1_4x4_4 using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename 
cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -429,9 +429,9 @@ static void BM_SM50_device_minimum_multiplies_dsrgemm_tt_t_16x128x8_16x64x1_4x8_ using WarpShape = cutlass::gemm::GemmShape<16, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -479,9 +479,9 @@ static void BM_SM50_device_minimum_multiplies_dsrgemm_tt_t_32x32x8_32x16x1_4x4_8 using WarpShape = cutlass::gemm::GemmShape<32, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -529,9 +529,9 @@ static void BM_SM50_device_minimum_multiplies_dsrgemm_tt_t_32x64x8_32x32x1_8x4_4 using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename 
cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -579,9 +579,9 @@ static void BM_SM50_device_minimum_multiplies_dsrgemm_tt_t_32x32x8_16x32x1_4x4_4 using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -629,9 +629,9 @@ static void BM_SM50_device_minimum_multiplies_dsrgemm_tt_t_64x32x8_32x32x1_8x4_4 using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -679,9 +679,9 @@ static void BM_SM50_device_minimum_multiplies_dsrgemm_tt_t_16x32x8_8x16x1_2x2_4x using WarpShape = cutlass::gemm::GemmShape<8, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename 
cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -729,9 +729,9 @@ static void BM_SM50_device_minimum_multiplies_dsrgemm_tt_t_16x64x8_8x32x1_2x4_4x using WarpShape = cutlass::gemm::GemmShape<8, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -779,9 +779,9 @@ static void BM_SM50_device_minimum_multiplies_dsrgemm_tt_t_32x32x8_16x16x1_4x2_4 using WarpShape = cutlass::gemm::GemmShape<16, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -829,9 +829,9 @@ static void BM_SM50_device_minimum_multiplies_dsrgemm_tt_t_32x64x8_16x32x1_4x4_4 using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename 
cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -879,9 +879,9 @@ static void BM_SM50_device_minimum_multiplies_dsrgemm_tt_t_32x128x8_16x64x1_4x8_ using WarpShape = cutlass::gemm::GemmShape<16, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -929,9 +929,9 @@ static void BM_SM50_device_minimum_multiplies_dsrgemm_tt_t_64x32x8_32x16x1_4x4_8 using WarpShape = cutlass::gemm::GemmShape<32, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -979,9 +979,9 @@ static void BM_SM50_device_minimum_multiplies_dsrgemm_tt_t_64x64x8_32x32x1_8x4_4 using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename 
cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1029,9 +1029,9 @@ static void BM_SM50_device_minimum_multiplies_dsrgemm_tt_t_128x32x8_64x16x1_8x4_ using WarpShape = cutlass::gemm::GemmShape<64, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1079,9 +1079,9 @@ static void BM_SM50_device_minimum_multiplies_dsrgemm_tt_t_16x64x16_8x16x1_2x2_4 using WarpShape = cutlass::gemm::GemmShape<8, 16, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1129,9 +1129,9 @@ static void BM_SM50_device_minimum_multiplies_dsrgemm_tt_t_16x128x16_8x32x1_2x4_ using WarpShape = cutlass::gemm::GemmShape<8, 32, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename 
cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1179,9 +1179,9 @@ static void BM_SM50_device_minimum_multiplies_dsrgemm_tt_t_32x32x8_16x8x1_2x2_8x using WarpShape = cutlass::gemm::GemmShape<16, 8, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1229,9 +1229,9 @@ static void BM_SM50_device_minimum_multiplies_dsrgemm_tt_t_32x64x8_16x16x1_4x2_4 using WarpShape = cutlass::gemm::GemmShape<16, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1279,9 +1279,9 @@ static void BM_SM50_device_minimum_multiplies_dsrgemm_tt_t_32x128x8_16x32x1_4x4_ using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename 
cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1329,9 +1329,9 @@ static void BM_SM50_device_minimum_multiplies_dsrgemm_tt_t_64x64x8_32x16x1_4x4_8 using WarpShape = cutlass::gemm::GemmShape<32, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1379,9 +1379,9 @@ static void BM_SM50_device_minimum_multiplies_dsrgemm_tt_t_32x32x8_8x16x1_2x2_4x using WarpShape = cutlass::gemm::GemmShape<8, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1429,9 +1429,9 @@ static void BM_SM50_device_minimum_multiplies_dsrgemm_tt_t_64x32x8_16x16x1_4x2_4 using WarpShape = cutlass::gemm::GemmShape<16, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename 
cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1479,9 +1479,9 @@ static void BM_SM50_device_minimum_multiplies_dsrgemm_tt_t_64x64x8_16x32x1_4x4_4 using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1529,9 +1529,9 @@ static void BM_SM50_device_minimum_multiplies_dsrgemm_tt_t_128x32x8_32x16x1_4x4_ using WarpShape = cutlass::gemm::GemmShape<32, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1579,9 +1579,9 @@ static void BM_SM50_device_minimum_multiplies_dsrgemm_tt_t_32x64x16_8x16x1_2x2_4 using WarpShape = cutlass::gemm::GemmShape<8, 16, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename 
cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1629,9 +1629,9 @@ static void BM_SM50_device_minimum_multiplies_dsrgemm_tt_t_32x128x16_8x32x1_2x4_ using WarpShape = cutlass::gemm::GemmShape<8, 32, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1679,9 +1679,9 @@ static void BM_SM50_device_minimum_multiplies_dsrgemm_tt_t_64x32x16_16x8x1_2x2_8 using WarpShape = cutlass::gemm::GemmShape<16, 8, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1729,9 +1729,9 @@ static void BM_SM50_device_minimum_multiplies_dsrgemm_tt_t_64x64x8_16x16x1_4x2_4 using WarpShape = cutlass::gemm::GemmShape<16, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename 
cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1779,9 +1779,9 @@ static void BM_SM50_device_minimum_multiplies_dsrgemm_tt_t_128x32x16_32x8x1_4x2_ using WarpShape = cutlass::gemm::GemmShape<32, 8, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; diff --git a/bench/device/sm50_simt_minimum_multiplies_ssrgemm_nn_n.cu b/bench/device/sm50_simt_minimum_multiplies_ssrgemm_nn_n.cu index e1c3432..4678c6b 100644 --- a/bench/device/sm50_simt_minimum_multiplies_ssrgemm_nn_n.cu +++ b/bench/device/sm50_simt_minimum_multiplies_ssrgemm_nn_n.cu @@ -29,9 +29,9 @@ static void BM_SM50_device_minimum_multiplies_ssrgemm_nn_n_8x32x8_8x32x1_2x4_4x8 using WarpShape = cutlass::gemm::GemmShape<8, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = 
Config::MultiplicationOp; @@ -79,9 +79,9 @@ static void BM_SM50_device_minimum_multiplies_ssrgemm_nn_n_16x32x8_16x32x1_4x4_4 using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -129,9 +129,9 @@ static void BM_SM50_device_minimum_multiplies_ssrgemm_nn_n_16x64x8_16x64x1_4x8_4 using WarpShape = cutlass::gemm::GemmShape<16, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -179,9 +179,9 @@ static void BM_SM50_device_minimum_multiplies_ssrgemm_nn_n_32x32x8_32x32x1_8x4_4 using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -229,9 +229,9 
@@ static void BM_SM50_device_minimum_multiplies_ssrgemm_nn_n_32x64x8_32x64x1_8x8_4 using WarpShape = cutlass::gemm::GemmShape<32, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -279,9 +279,9 @@ static void BM_SM50_device_minimum_multiplies_ssrgemm_nn_n_64x32x8_64x32x1_8x8_8 using WarpShape = cutlass::gemm::GemmShape<64, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -329,9 +329,9 @@ static void BM_SM50_device_minimum_multiplies_ssrgemm_nn_n_8x32x8_8x16x1_2x2_4x8 using WarpShape = cutlass::gemm::GemmShape<8, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -379,9 +379,9 @@ static void 
BM_SM50_device_minimum_multiplies_ssrgemm_nn_n_8x64x8_8x32x1_2x4_4x8 using WarpShape = cutlass::gemm::GemmShape<8, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -429,9 +429,9 @@ static void BM_SM50_device_minimum_multiplies_ssrgemm_nn_n_16x32x8_16x16x1_4x2_4 using WarpShape = cutlass::gemm::GemmShape<16, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -479,9 +479,9 @@ static void BM_SM50_device_minimum_multiplies_ssrgemm_nn_n_16x64x8_16x32x1_4x4_4 using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -529,9 +529,9 @@ static void 
BM_SM50_device_minimum_multiplies_ssrgemm_nn_n_16x128x8_16x64x1_4x8_ using WarpShape = cutlass::gemm::GemmShape<16, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -579,9 +579,9 @@ static void BM_SM50_device_minimum_multiplies_ssrgemm_nn_n_32x32x8_32x16x1_4x4_8 using WarpShape = cutlass::gemm::GemmShape<32, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -629,9 +629,9 @@ static void BM_SM50_device_minimum_multiplies_ssrgemm_nn_n_32x64x8_32x32x1_8x4_4 using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -679,9 +679,9 @@ static void 
BM_SM50_device_minimum_multiplies_ssrgemm_nn_n_32x128x8_32x64x1_8x8_ using WarpShape = cutlass::gemm::GemmShape<32, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -729,9 +729,9 @@ static void BM_SM50_device_minimum_multiplies_ssrgemm_nn_n_64x64x8_64x32x1_8x8_8 using WarpShape = cutlass::gemm::GemmShape<64, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -779,9 +779,9 @@ static void BM_SM50_device_minimum_multiplies_ssrgemm_nn_n_32x32x8_16x32x1_4x4_4 using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -829,9 +829,9 @@ static void 
BM_SM50_device_minimum_multiplies_ssrgemm_nn_n_64x32x8_32x32x1_8x4_4 using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -879,9 +879,9 @@ static void BM_SM50_device_minimum_multiplies_ssrgemm_nn_n_64x64x8_32x64x1_8x8_4 using WarpShape = cutlass::gemm::GemmShape<32, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -929,9 +929,9 @@ static void BM_SM50_device_minimum_multiplies_ssrgemm_nn_n_128x32x8_64x32x1_8x8_ using WarpShape = cutlass::gemm::GemmShape<64, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -979,9 +979,9 @@ static void 
BM_SM50_device_minimum_multiplies_ssrgemm_nn_n_16x32x8_8x16x1_2x2_4x using WarpShape = cutlass::gemm::GemmShape<8, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1029,9 +1029,9 @@ static void BM_SM50_device_minimum_multiplies_ssrgemm_nn_n_16x64x8_8x32x1_2x4_4x using WarpShape = cutlass::gemm::GemmShape<8, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1079,9 +1079,9 @@ static void BM_SM50_device_minimum_multiplies_ssrgemm_nn_n_32x32x8_16x16x1_4x2_4 using WarpShape = cutlass::gemm::GemmShape<16, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1129,9 +1129,9 @@ static void 
BM_SM50_device_minimum_multiplies_ssrgemm_nn_n_32x64x8_16x32x1_4x4_4 using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1179,9 +1179,9 @@ static void BM_SM50_device_minimum_multiplies_ssrgemm_nn_n_32x128x8_16x64x1_4x8_ using WarpShape = cutlass::gemm::GemmShape<16, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1229,9 +1229,9 @@ static void BM_SM50_device_minimum_multiplies_ssrgemm_nn_n_64x32x8_32x16x1_4x4_8 using WarpShape = cutlass::gemm::GemmShape<32, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1279,9 +1279,9 @@ static void 
BM_SM50_device_minimum_multiplies_ssrgemm_nn_n_64x64x8_32x32x1_8x4_4 using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1329,9 +1329,9 @@ static void BM_SM50_device_minimum_multiplies_ssrgemm_nn_n_64x128x8_32x64x1_8x8_ using WarpShape = cutlass::gemm::GemmShape<32, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1379,9 +1379,9 @@ static void BM_SM50_device_minimum_multiplies_ssrgemm_nn_n_128x32x8_64x16x1_8x4_ using WarpShape = cutlass::gemm::GemmShape<64, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1429,9 +1429,9 @@ static void 
BM_SM50_device_minimum_multiplies_ssrgemm_nn_n_128x64x8_64x32x1_8x8_ using WarpShape = cutlass::gemm::GemmShape<64, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1479,9 +1479,9 @@ static void BM_SM50_device_minimum_multiplies_ssrgemm_nn_n_16x64x16_8x16x1_2x2_4 using WarpShape = cutlass::gemm::GemmShape<8, 16, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1529,9 +1529,9 @@ static void BM_SM50_device_minimum_multiplies_ssrgemm_nn_n_16x128x16_8x32x1_2x4_ using WarpShape = cutlass::gemm::GemmShape<8, 32, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1579,9 +1579,9 @@ static void 
BM_SM50_device_minimum_multiplies_ssrgemm_nn_n_32x32x8_16x8x1_2x2_8x using WarpShape = cutlass::gemm::GemmShape<16, 8, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1629,9 +1629,9 @@ static void BM_SM50_device_minimum_multiplies_ssrgemm_nn_n_32x64x8_16x16x1_4x2_4 using WarpShape = cutlass::gemm::GemmShape<16, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1679,9 +1679,9 @@ static void BM_SM50_device_minimum_multiplies_ssrgemm_nn_n_32x128x8_16x32x1_4x4_ using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1729,9 +1729,9 @@ static void 
BM_SM50_device_minimum_multiplies_ssrgemm_nn_n_32x256x8_16x64x1_4x8_ using WarpShape = cutlass::gemm::GemmShape<16, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1779,9 +1779,9 @@ static void BM_SM50_device_minimum_multiplies_ssrgemm_nn_n_64x64x8_32x16x1_4x4_8 using WarpShape = cutlass::gemm::GemmShape<32, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1829,9 +1829,9 @@ static void BM_SM50_device_minimum_multiplies_ssrgemm_nn_n_64x128x8_32x32x1_8x4_ using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1879,9 +1879,9 @@ static void 
BM_SM50_device_minimum_multiplies_ssrgemm_nn_n_64x256x8_32x64x1_8x8_ using WarpShape = cutlass::gemm::GemmShape<32, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1929,9 +1929,9 @@ static void BM_SM50_device_minimum_multiplies_ssrgemm_nn_n_128x128x8_64x32x1_8x8 using WarpShape = cutlass::gemm::GemmShape<64, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1979,9 +1979,9 @@ static void BM_SM50_device_minimum_multiplies_ssrgemm_nn_n_32x32x8_8x16x1_2x2_4x using WarpShape = cutlass::gemm::GemmShape<8, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -2029,9 +2029,9 @@ static void 
BM_SM50_device_minimum_multiplies_ssrgemm_nn_n_64x32x8_16x16x1_4x2_4 using WarpShape = cutlass::gemm::GemmShape<16, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -2079,9 +2079,9 @@ static void BM_SM50_device_minimum_multiplies_ssrgemm_nn_n_64x64x8_16x32x1_4x4_4 using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -2129,9 +2129,9 @@ static void BM_SM50_device_minimum_multiplies_ssrgemm_nn_n_128x32x8_32x16x1_4x4_ using WarpShape = cutlass::gemm::GemmShape<32, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -2179,9 +2179,9 @@ static void 
BM_SM50_device_minimum_multiplies_ssrgemm_nn_n_128x64x8_32x32x1_8x4_ using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -2229,9 +2229,9 @@ static void BM_SM50_device_minimum_multiplies_ssrgemm_nn_n_128x128x8_32x64x1_8x8 using WarpShape = cutlass::gemm::GemmShape<32, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -2279,9 +2279,9 @@ static void BM_SM50_device_minimum_multiplies_ssrgemm_nn_n_256x32x8_64x16x1_8x4_ using WarpShape = cutlass::gemm::GemmShape<64, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -2329,9 +2329,9 @@ static void 
BM_SM50_device_minimum_multiplies_ssrgemm_nn_n_256x64x8_64x32x1_8x8_ using WarpShape = cutlass::gemm::GemmShape<64, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -2379,9 +2379,9 @@ static void BM_SM50_device_minimum_multiplies_ssrgemm_nn_n_32x64x16_8x16x1_2x2_4 using WarpShape = cutlass::gemm::GemmShape<8, 16, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -2429,9 +2429,9 @@ static void BM_SM50_device_minimum_multiplies_ssrgemm_nn_n_32x128x16_8x32x1_2x4_ using WarpShape = cutlass::gemm::GemmShape<8, 32, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -2479,9 +2479,9 @@ static void 
BM_SM50_device_minimum_multiplies_ssrgemm_nn_n_64x32x16_16x8x1_2x2_8 using WarpShape = cutlass::gemm::GemmShape<16, 8, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -2529,9 +2529,9 @@ static void BM_SM50_device_minimum_multiplies_ssrgemm_nn_n_64x64x8_16x16x1_4x2_4 using WarpShape = cutlass::gemm::GemmShape<16, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -2579,9 +2579,9 @@ static void BM_SM50_device_minimum_multiplies_ssrgemm_nn_n_64x128x8_16x32x1_4x4_ using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -2629,9 +2629,9 @@ static void 
BM_SM50_device_minimum_multiplies_ssrgemm_nn_n_64x256x8_16x64x1_4x8_ using WarpShape = cutlass::gemm::GemmShape<16, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -2679,9 +2679,9 @@ static void BM_SM50_device_minimum_multiplies_ssrgemm_nn_n_128x32x16_32x8x1_4x2_ using WarpShape = cutlass::gemm::GemmShape<32, 8, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -2729,9 +2729,9 @@ static void BM_SM50_device_minimum_multiplies_ssrgemm_nn_n_128x64x8_32x16x1_4x4_ using WarpShape = cutlass::gemm::GemmShape<32, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -2779,9 +2779,9 @@ static void 
BM_SM50_device_minimum_multiplies_ssrgemm_nn_n_128x128x8_32x32x1_8x4 using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -2829,9 +2829,9 @@ static void BM_SM50_device_minimum_multiplies_ssrgemm_nn_n_256x64x8_64x16x1_8x4_ using WarpShape = cutlass::gemm::GemmShape<64, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; diff --git a/bench/device/sm50_simt_minimum_multiplies_ssrgemm_nn_t.cu b/bench/device/sm50_simt_minimum_multiplies_ssrgemm_nn_t.cu index 4e98030..e4469bb 100644 --- a/bench/device/sm50_simt_minimum_multiplies_ssrgemm_nn_t.cu +++ b/bench/device/sm50_simt_minimum_multiplies_ssrgemm_nn_t.cu @@ -29,9 +29,9 @@ static void BM_SM50_device_minimum_multiplies_ssrgemm_nn_t_8x32x8_8x32x1_2x4_4x8 using WarpShape = cutlass::gemm::GemmShape<8, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename 
cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -79,9 +79,9 @@ static void BM_SM50_device_minimum_multiplies_ssrgemm_nn_t_16x32x8_16x32x1_4x4_4 using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -129,9 +129,9 @@ static void BM_SM50_device_minimum_multiplies_ssrgemm_nn_t_16x64x8_16x64x1_4x8_4 using WarpShape = cutlass::gemm::GemmShape<16, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -179,9 +179,9 @@ static void BM_SM50_device_minimum_multiplies_ssrgemm_nn_t_32x32x8_32x32x1_8x4_4 using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename 
cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -229,9 +229,9 @@ static void BM_SM50_device_minimum_multiplies_ssrgemm_nn_t_32x64x8_32x64x1_8x8_4 using WarpShape = cutlass::gemm::GemmShape<32, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -279,9 +279,9 @@ static void BM_SM50_device_minimum_multiplies_ssrgemm_nn_t_64x32x8_64x32x1_8x8_8 using WarpShape = cutlass::gemm::GemmShape<64, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -329,9 +329,9 @@ static void BM_SM50_device_minimum_multiplies_ssrgemm_nn_t_8x32x8_8x16x1_2x2_4x8 using WarpShape = cutlass::gemm::GemmShape<8, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename 
cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -379,9 +379,9 @@ static void BM_SM50_device_minimum_multiplies_ssrgemm_nn_t_8x64x8_8x32x1_2x4_4x8 using WarpShape = cutlass::gemm::GemmShape<8, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -429,9 +429,9 @@ static void BM_SM50_device_minimum_multiplies_ssrgemm_nn_t_16x32x8_16x16x1_4x2_4 using WarpShape = cutlass::gemm::GemmShape<16, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -479,9 +479,9 @@ static void BM_SM50_device_minimum_multiplies_ssrgemm_nn_t_16x64x8_16x32x1_4x4_4 using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename 
cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -529,9 +529,9 @@ static void BM_SM50_device_minimum_multiplies_ssrgemm_nn_t_16x128x8_16x64x1_4x8_ using WarpShape = cutlass::gemm::GemmShape<16, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -579,9 +579,9 @@ static void BM_SM50_device_minimum_multiplies_ssrgemm_nn_t_32x32x8_32x16x1_4x4_8 using WarpShape = cutlass::gemm::GemmShape<32, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -629,9 +629,9 @@ static void BM_SM50_device_minimum_multiplies_ssrgemm_nn_t_32x64x8_32x32x1_8x4_4 using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename 
cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -679,9 +679,9 @@ static void BM_SM50_device_minimum_multiplies_ssrgemm_nn_t_32x128x8_32x64x1_8x8_ using WarpShape = cutlass::gemm::GemmShape<32, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -729,9 +729,9 @@ static void BM_SM50_device_minimum_multiplies_ssrgemm_nn_t_64x64x8_64x32x1_8x8_8 using WarpShape = cutlass::gemm::GemmShape<64, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -779,9 +779,9 @@ static void BM_SM50_device_minimum_multiplies_ssrgemm_nn_t_32x32x8_16x32x1_4x4_4 using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename 
cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -829,9 +829,9 @@ static void BM_SM50_device_minimum_multiplies_ssrgemm_nn_t_64x32x8_32x32x1_8x4_4 using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -879,9 +879,9 @@ static void BM_SM50_device_minimum_multiplies_ssrgemm_nn_t_64x64x8_32x64x1_8x8_4 using WarpShape = cutlass::gemm::GemmShape<32, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -929,9 +929,9 @@ static void BM_SM50_device_minimum_multiplies_ssrgemm_nn_t_128x32x8_64x32x1_8x8_ using WarpShape = cutlass::gemm::GemmShape<64, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename 
cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -979,9 +979,9 @@ static void BM_SM50_device_minimum_multiplies_ssrgemm_nn_t_16x32x8_8x16x1_2x2_4x using WarpShape = cutlass::gemm::GemmShape<8, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1029,9 +1029,9 @@ static void BM_SM50_device_minimum_multiplies_ssrgemm_nn_t_16x64x8_8x32x1_2x4_4x using WarpShape = cutlass::gemm::GemmShape<8, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1079,9 +1079,9 @@ static void BM_SM50_device_minimum_multiplies_ssrgemm_nn_t_32x32x8_16x16x1_4x2_4 using WarpShape = cutlass::gemm::GemmShape<16, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename 
cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1129,9 +1129,9 @@ static void BM_SM50_device_minimum_multiplies_ssrgemm_nn_t_32x64x8_16x32x1_4x4_4 using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1179,9 +1179,9 @@ static void BM_SM50_device_minimum_multiplies_ssrgemm_nn_t_32x128x8_16x64x1_4x8_ using WarpShape = cutlass::gemm::GemmShape<16, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1229,9 +1229,9 @@ static void BM_SM50_device_minimum_multiplies_ssrgemm_nn_t_64x32x8_32x16x1_4x4_8 using WarpShape = cutlass::gemm::GemmShape<32, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename 
cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1279,9 +1279,9 @@ static void BM_SM50_device_minimum_multiplies_ssrgemm_nn_t_64x64x8_32x32x1_8x4_4 using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1329,9 +1329,9 @@ static void BM_SM50_device_minimum_multiplies_ssrgemm_nn_t_64x128x8_32x64x1_8x8_ using WarpShape = cutlass::gemm::GemmShape<32, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1379,9 +1379,9 @@ static void BM_SM50_device_minimum_multiplies_ssrgemm_nn_t_128x32x8_64x16x1_8x4_ using WarpShape = cutlass::gemm::GemmShape<64, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename 
cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1429,9 +1429,9 @@ static void BM_SM50_device_minimum_multiplies_ssrgemm_nn_t_128x64x8_64x32x1_8x8_ using WarpShape = cutlass::gemm::GemmShape<64, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1479,9 +1479,9 @@ static void BM_SM50_device_minimum_multiplies_ssrgemm_nn_t_16x64x16_8x16x1_2x2_4 using WarpShape = cutlass::gemm::GemmShape<8, 16, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1529,9 +1529,9 @@ static void BM_SM50_device_minimum_multiplies_ssrgemm_nn_t_16x128x16_8x32x1_2x4_ using WarpShape = cutlass::gemm::GemmShape<8, 32, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename 
cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1579,9 +1579,9 @@ static void BM_SM50_device_minimum_multiplies_ssrgemm_nn_t_32x32x8_16x8x1_2x2_8x using WarpShape = cutlass::gemm::GemmShape<16, 8, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1629,9 +1629,9 @@ static void BM_SM50_device_minimum_multiplies_ssrgemm_nn_t_32x64x8_16x16x1_4x2_4 using WarpShape = cutlass::gemm::GemmShape<16, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1679,9 +1679,9 @@ static void BM_SM50_device_minimum_multiplies_ssrgemm_nn_t_32x128x8_16x32x1_4x4_ using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename 
cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1729,9 +1729,9 @@ static void BM_SM50_device_minimum_multiplies_ssrgemm_nn_t_32x256x8_16x64x1_4x8_ using WarpShape = cutlass::gemm::GemmShape<16, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1779,9 +1779,9 @@ static void BM_SM50_device_minimum_multiplies_ssrgemm_nn_t_64x64x8_32x16x1_4x4_8 using WarpShape = cutlass::gemm::GemmShape<32, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1829,9 +1829,9 @@ static void BM_SM50_device_minimum_multiplies_ssrgemm_nn_t_64x128x8_32x32x1_8x4_ using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename 
cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1879,9 +1879,9 @@ static void BM_SM50_device_minimum_multiplies_ssrgemm_nn_t_64x256x8_32x64x1_8x8_ using WarpShape = cutlass::gemm::GemmShape<32, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1929,9 +1929,9 @@ static void BM_SM50_device_minimum_multiplies_ssrgemm_nn_t_128x128x8_64x32x1_8x8 using WarpShape = cutlass::gemm::GemmShape<64, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1979,9 +1979,9 @@ static void BM_SM50_device_minimum_multiplies_ssrgemm_nn_t_32x32x8_8x16x1_2x2_4x using WarpShape = cutlass::gemm::GemmShape<8, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename 
cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -2029,9 +2029,9 @@ static void BM_SM50_device_minimum_multiplies_ssrgemm_nn_t_64x32x8_16x16x1_4x2_4 using WarpShape = cutlass::gemm::GemmShape<16, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -2079,9 +2079,9 @@ static void BM_SM50_device_minimum_multiplies_ssrgemm_nn_t_64x64x8_16x32x1_4x4_4 using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -2129,9 +2129,9 @@ static void BM_SM50_device_minimum_multiplies_ssrgemm_nn_t_128x32x8_32x16x1_4x4_ using WarpShape = cutlass::gemm::GemmShape<32, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename 
cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -2179,9 +2179,9 @@ static void BM_SM50_device_minimum_multiplies_ssrgemm_nn_t_128x64x8_32x32x1_8x4_ using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -2229,9 +2229,9 @@ static void BM_SM50_device_minimum_multiplies_ssrgemm_nn_t_128x128x8_32x64x1_8x8 using WarpShape = cutlass::gemm::GemmShape<32, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -2279,9 +2279,9 @@ static void BM_SM50_device_minimum_multiplies_ssrgemm_nn_t_256x32x8_64x16x1_8x4_ using WarpShape = cutlass::gemm::GemmShape<64, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename 
cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -2329,9 +2329,9 @@ static void BM_SM50_device_minimum_multiplies_ssrgemm_nn_t_256x64x8_64x32x1_8x8_ using WarpShape = cutlass::gemm::GemmShape<64, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -2379,9 +2379,9 @@ static void BM_SM50_device_minimum_multiplies_ssrgemm_nn_t_32x64x16_8x16x1_2x2_4 using WarpShape = cutlass::gemm::GemmShape<8, 16, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -2429,9 +2429,9 @@ static void BM_SM50_device_minimum_multiplies_ssrgemm_nn_t_32x128x16_8x32x1_2x4_ using WarpShape = cutlass::gemm::GemmShape<8, 32, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename 
cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -2479,9 +2479,9 @@ static void BM_SM50_device_minimum_multiplies_ssrgemm_nn_t_64x32x16_16x8x1_2x2_8 using WarpShape = cutlass::gemm::GemmShape<16, 8, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -2529,9 +2529,9 @@ static void BM_SM50_device_minimum_multiplies_ssrgemm_nn_t_64x64x8_16x16x1_4x2_4 using WarpShape = cutlass::gemm::GemmShape<16, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -2579,9 +2579,9 @@ static void BM_SM50_device_minimum_multiplies_ssrgemm_nn_t_64x128x8_16x32x1_4x4_ using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename 
cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -2629,9 +2629,9 @@ static void BM_SM50_device_minimum_multiplies_ssrgemm_nn_t_64x256x8_16x64x1_4x8_ using WarpShape = cutlass::gemm::GemmShape<16, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -2679,9 +2679,9 @@ static void BM_SM50_device_minimum_multiplies_ssrgemm_nn_t_128x32x16_32x8x1_4x2_ using WarpShape = cutlass::gemm::GemmShape<32, 8, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -2729,9 +2729,9 @@ static void BM_SM50_device_minimum_multiplies_ssrgemm_nn_t_128x64x8_32x16x1_4x4_ using WarpShape = cutlass::gemm::GemmShape<32, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename 
cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -2779,9 +2779,9 @@ static void BM_SM50_device_minimum_multiplies_ssrgemm_nn_t_128x128x8_32x32x1_8x4 using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -2829,9 +2829,9 @@ static void BM_SM50_device_minimum_multiplies_ssrgemm_nn_t_256x64x8_64x16x1_8x4_ using WarpShape = cutlass::gemm::GemmShape<64, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; diff --git a/bench/device/sm50_simt_minimum_multiplies_ssrgemm_nt_n.cu b/bench/device/sm50_simt_minimum_multiplies_ssrgemm_nt_n.cu index e4adac9..dc24cc7 100644 --- a/bench/device/sm50_simt_minimum_multiplies_ssrgemm_nt_n.cu +++ b/bench/device/sm50_simt_minimum_multiplies_ssrgemm_nt_n.cu @@ -29,9 +29,9 @@ static void BM_SM50_device_minimum_multiplies_ssrgemm_nt_n_8x32x8_8x32x1_2x4_4x8 using WarpShape = cutlass::gemm::GemmShape<8, 32, 8>; using 
InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -79,9 +79,9 @@ static void BM_SM50_device_minimum_multiplies_ssrgemm_nt_n_16x32x8_16x32x1_4x4_4 using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -129,9 +129,9 @@ static void BM_SM50_device_minimum_multiplies_ssrgemm_nt_n_16x64x8_16x64x1_4x8_4 using WarpShape = cutlass::gemm::GemmShape<16, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -179,9 +179,9 @@ static void BM_SM50_device_minimum_multiplies_ssrgemm_nt_n_32x32x8_32x32x1_8x4_4 using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = 
cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -229,9 +229,9 @@ static void BM_SM50_device_minimum_multiplies_ssrgemm_nt_n_32x64x8_32x64x1_8x8_4 using WarpShape = cutlass::gemm::GemmShape<32, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -279,9 +279,9 @@ static void BM_SM50_device_minimum_multiplies_ssrgemm_nt_n_64x32x8_64x32x1_8x8_8 using WarpShape = cutlass::gemm::GemmShape<64, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -329,9 +329,9 @@ static void BM_SM50_device_minimum_multiplies_ssrgemm_nt_n_8x32x8_8x16x1_2x2_4x8 using WarpShape = cutlass::gemm::GemmShape<8, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - 
using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -379,9 +379,9 @@ static void BM_SM50_device_minimum_multiplies_ssrgemm_nt_n_8x64x8_8x32x1_2x4_4x8 using WarpShape = cutlass::gemm::GemmShape<8, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -429,9 +429,9 @@ static void BM_SM50_device_minimum_multiplies_ssrgemm_nt_n_16x32x8_16x16x1_4x2_4 using WarpShape = cutlass::gemm::GemmShape<16, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -479,9 +479,9 @@ static void BM_SM50_device_minimum_multiplies_ssrgemm_nt_n_16x64x8_16x32x1_4x4_4 using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename 
cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -529,9 +529,9 @@ static void BM_SM50_device_minimum_multiplies_ssrgemm_nt_n_16x128x8_16x64x1_4x8_ using WarpShape = cutlass::gemm::GemmShape<16, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -579,9 +579,9 @@ static void BM_SM50_device_minimum_multiplies_ssrgemm_nt_n_32x32x8_32x16x1_4x4_8 using WarpShape = cutlass::gemm::GemmShape<32, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -629,9 +629,9 @@ static void BM_SM50_device_minimum_multiplies_ssrgemm_nt_n_32x64x8_32x32x1_8x4_4 using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename 
cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -679,9 +679,9 @@ static void BM_SM50_device_minimum_multiplies_ssrgemm_nt_n_32x128x8_32x64x1_8x8_ using WarpShape = cutlass::gemm::GemmShape<32, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -729,9 +729,9 @@ static void BM_SM50_device_minimum_multiplies_ssrgemm_nt_n_64x64x8_64x32x1_8x8_8 using WarpShape = cutlass::gemm::GemmShape<64, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -779,9 +779,9 @@ static void BM_SM50_device_minimum_multiplies_ssrgemm_nt_n_32x32x8_16x32x1_4x4_4 using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename 
cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -829,9 +829,9 @@ static void BM_SM50_device_minimum_multiplies_ssrgemm_nt_n_64x32x8_32x32x1_8x4_4 using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -879,9 +879,9 @@ static void BM_SM50_device_minimum_multiplies_ssrgemm_nt_n_64x64x8_32x64x1_8x8_4 using WarpShape = cutlass::gemm::GemmShape<32, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -929,9 +929,9 @@ static void BM_SM50_device_minimum_multiplies_ssrgemm_nt_n_128x32x8_64x32x1_8x8_ using WarpShape = cutlass::gemm::GemmShape<64, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename 
cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -979,9 +979,9 @@ static void BM_SM50_device_minimum_multiplies_ssrgemm_nt_n_16x32x8_8x16x1_2x2_4x using WarpShape = cutlass::gemm::GemmShape<8, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1029,9 +1029,9 @@ static void BM_SM50_device_minimum_multiplies_ssrgemm_nt_n_16x64x8_8x32x1_2x4_4x using WarpShape = cutlass::gemm::GemmShape<8, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1079,9 +1079,9 @@ static void BM_SM50_device_minimum_multiplies_ssrgemm_nt_n_32x32x8_16x16x1_4x2_4 using WarpShape = cutlass::gemm::GemmShape<16, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename 
cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1129,9 +1129,9 @@ static void BM_SM50_device_minimum_multiplies_ssrgemm_nt_n_32x64x8_16x32x1_4x4_4 using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1179,9 +1179,9 @@ static void BM_SM50_device_minimum_multiplies_ssrgemm_nt_n_32x128x8_16x64x1_4x8_ using WarpShape = cutlass::gemm::GemmShape<16, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1229,9 +1229,9 @@ static void BM_SM50_device_minimum_multiplies_ssrgemm_nt_n_64x32x8_32x16x1_4x4_8 using WarpShape = cutlass::gemm::GemmShape<32, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename 
cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1279,9 +1279,9 @@ static void BM_SM50_device_minimum_multiplies_ssrgemm_nt_n_64x64x8_32x32x1_8x4_4 using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1329,9 +1329,9 @@ static void BM_SM50_device_minimum_multiplies_ssrgemm_nt_n_64x128x8_32x64x1_8x8_ using WarpShape = cutlass::gemm::GemmShape<32, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1379,9 +1379,9 @@ static void BM_SM50_device_minimum_multiplies_ssrgemm_nt_n_128x32x8_64x16x1_8x4_ using WarpShape = cutlass::gemm::GemmShape<64, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename 
cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1429,9 +1429,9 @@ static void BM_SM50_device_minimum_multiplies_ssrgemm_nt_n_128x64x8_64x32x1_8x8_ using WarpShape = cutlass::gemm::GemmShape<64, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1479,9 +1479,9 @@ static void BM_SM50_device_minimum_multiplies_ssrgemm_nt_n_16x64x16_8x16x1_2x2_4 using WarpShape = cutlass::gemm::GemmShape<8, 16, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1529,9 +1529,9 @@ static void BM_SM50_device_minimum_multiplies_ssrgemm_nt_n_16x128x16_8x32x1_2x4_ using WarpShape = cutlass::gemm::GemmShape<8, 32, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename 
cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1579,9 +1579,9 @@ static void BM_SM50_device_minimum_multiplies_ssrgemm_nt_n_32x32x8_16x8x1_2x2_8x using WarpShape = cutlass::gemm::GemmShape<16, 8, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1629,9 +1629,9 @@ static void BM_SM50_device_minimum_multiplies_ssrgemm_nt_n_32x64x8_16x16x1_4x2_4 using WarpShape = cutlass::gemm::GemmShape<16, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1679,9 +1679,9 @@ static void BM_SM50_device_minimum_multiplies_ssrgemm_nt_n_32x128x8_16x32x1_4x4_ using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename 
cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1729,9 +1729,9 @@ static void BM_SM50_device_minimum_multiplies_ssrgemm_nt_n_32x256x8_16x64x1_4x8_ using WarpShape = cutlass::gemm::GemmShape<16, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1779,9 +1779,9 @@ static void BM_SM50_device_minimum_multiplies_ssrgemm_nt_n_64x64x8_32x16x1_4x4_8 using WarpShape = cutlass::gemm::GemmShape<32, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1829,9 +1829,9 @@ static void BM_SM50_device_minimum_multiplies_ssrgemm_nt_n_64x128x8_32x32x1_8x4_ using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename 
cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1879,9 +1879,9 @@ static void BM_SM50_device_minimum_multiplies_ssrgemm_nt_n_64x256x8_32x64x1_8x8_ using WarpShape = cutlass::gemm::GemmShape<32, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1929,9 +1929,9 @@ static void BM_SM50_device_minimum_multiplies_ssrgemm_nt_n_128x128x8_64x32x1_8x8 using WarpShape = cutlass::gemm::GemmShape<64, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1979,9 +1979,9 @@ static void BM_SM50_device_minimum_multiplies_ssrgemm_nt_n_32x32x8_8x16x1_2x2_4x using WarpShape = cutlass::gemm::GemmShape<8, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename 
cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -2029,9 +2029,9 @@ static void BM_SM50_device_minimum_multiplies_ssrgemm_nt_n_64x32x8_16x16x1_4x2_4 using WarpShape = cutlass::gemm::GemmShape<16, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -2079,9 +2079,9 @@ static void BM_SM50_device_minimum_multiplies_ssrgemm_nt_n_64x64x8_16x32x1_4x4_4 using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -2129,9 +2129,9 @@ static void BM_SM50_device_minimum_multiplies_ssrgemm_nt_n_128x32x8_32x16x1_4x4_ using WarpShape = cutlass::gemm::GemmShape<32, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename 
cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -2179,9 +2179,9 @@ static void BM_SM50_device_minimum_multiplies_ssrgemm_nt_n_128x64x8_32x32x1_8x4_ using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -2229,9 +2229,9 @@ static void BM_SM50_device_minimum_multiplies_ssrgemm_nt_n_128x128x8_32x64x1_8x8 using WarpShape = cutlass::gemm::GemmShape<32, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -2279,9 +2279,9 @@ static void BM_SM50_device_minimum_multiplies_ssrgemm_nt_n_256x32x8_64x16x1_8x4_ using WarpShape = cutlass::gemm::GemmShape<64, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename 
cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -2329,9 +2329,9 @@ static void BM_SM50_device_minimum_multiplies_ssrgemm_nt_n_256x64x8_64x32x1_8x8_ using WarpShape = cutlass::gemm::GemmShape<64, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -2379,9 +2379,9 @@ static void BM_SM50_device_minimum_multiplies_ssrgemm_nt_n_32x64x16_8x16x1_2x2_4 using WarpShape = cutlass::gemm::GemmShape<8, 16, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -2429,9 +2429,9 @@ static void BM_SM50_device_minimum_multiplies_ssrgemm_nt_n_32x128x16_8x32x1_2x4_ using WarpShape = cutlass::gemm::GemmShape<8, 32, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename 
cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -2479,9 +2479,9 @@ static void BM_SM50_device_minimum_multiplies_ssrgemm_nt_n_64x32x16_16x8x1_2x2_8 using WarpShape = cutlass::gemm::GemmShape<16, 8, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -2529,9 +2529,9 @@ static void BM_SM50_device_minimum_multiplies_ssrgemm_nt_n_64x64x8_16x16x1_4x2_4 using WarpShape = cutlass::gemm::GemmShape<16, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -2579,9 +2579,9 @@ static void BM_SM50_device_minimum_multiplies_ssrgemm_nt_n_64x128x8_16x32x1_4x4_ using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename 
cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -2629,9 +2629,9 @@ static void BM_SM50_device_minimum_multiplies_ssrgemm_nt_n_64x256x8_16x64x1_4x8_ using WarpShape = cutlass::gemm::GemmShape<16, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -2679,9 +2679,9 @@ static void BM_SM50_device_minimum_multiplies_ssrgemm_nt_n_128x32x16_32x8x1_4x2_ using WarpShape = cutlass::gemm::GemmShape<32, 8, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -2729,9 +2729,9 @@ static void BM_SM50_device_minimum_multiplies_ssrgemm_nt_n_128x64x8_32x16x1_4x4_ using WarpShape = cutlass::gemm::GemmShape<32, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename 
cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -2779,9 +2779,9 @@ static void BM_SM50_device_minimum_multiplies_ssrgemm_nt_n_128x128x8_32x32x1_8x4 using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -2829,9 +2829,9 @@ static void BM_SM50_device_minimum_multiplies_ssrgemm_nt_n_256x64x8_64x16x1_8x4_ using WarpShape = cutlass::gemm::GemmShape<64, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; diff --git a/bench/device/sm50_simt_minimum_multiplies_ssrgemm_nt_t.cu b/bench/device/sm50_simt_minimum_multiplies_ssrgemm_nt_t.cu index 37620e0..44a0f67 100644 --- a/bench/device/sm50_simt_minimum_multiplies_ssrgemm_nt_t.cu +++ 
b/bench/device/sm50_simt_minimum_multiplies_ssrgemm_nt_t.cu @@ -29,9 +29,9 @@ static void BM_SM50_device_minimum_multiplies_ssrgemm_nt_t_8x32x8_8x32x1_2x4_4x8 using WarpShape = cutlass::gemm::GemmShape<8, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -79,9 +79,9 @@ static void BM_SM50_device_minimum_multiplies_ssrgemm_nt_t_16x32x8_16x32x1_4x4_4 using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -129,9 +129,9 @@ static void BM_SM50_device_minimum_multiplies_ssrgemm_nt_t_16x64x8_16x64x1_4x8_4 using WarpShape = cutlass::gemm::GemmShape<16, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = 
Config::MultiplicationOp; @@ -179,9 +179,9 @@ static void BM_SM50_device_minimum_multiplies_ssrgemm_nt_t_32x32x8_32x32x1_8x4_4 using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -229,9 +229,9 @@ static void BM_SM50_device_minimum_multiplies_ssrgemm_nt_t_32x64x8_32x64x1_8x8_4 using WarpShape = cutlass::gemm::GemmShape<32, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -279,9 +279,9 @@ static void BM_SM50_device_minimum_multiplies_ssrgemm_nt_t_64x32x8_64x32x1_8x8_8 using WarpShape = cutlass::gemm::GemmShape<64, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -329,9 
+329,9 @@ static void BM_SM50_device_minimum_multiplies_ssrgemm_nt_t_8x32x8_8x16x1_2x2_4x8 using WarpShape = cutlass::gemm::GemmShape<8, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -379,9 +379,9 @@ static void BM_SM50_device_minimum_multiplies_ssrgemm_nt_t_8x64x8_8x32x1_2x4_4x8 using WarpShape = cutlass::gemm::GemmShape<8, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -429,9 +429,9 @@ static void BM_SM50_device_minimum_multiplies_ssrgemm_nt_t_16x32x8_16x16x1_4x2_4 using WarpShape = cutlass::gemm::GemmShape<16, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -479,9 +479,9 @@ static void 
BM_SM50_device_minimum_multiplies_ssrgemm_nt_t_16x64x8_16x32x1_4x4_4 using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -529,9 +529,9 @@ static void BM_SM50_device_minimum_multiplies_ssrgemm_nt_t_16x128x8_16x64x1_4x8_ using WarpShape = cutlass::gemm::GemmShape<16, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -579,9 +579,9 @@ static void BM_SM50_device_minimum_multiplies_ssrgemm_nt_t_32x32x8_32x16x1_4x4_8 using WarpShape = cutlass::gemm::GemmShape<32, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -629,9 +629,9 @@ static void 
BM_SM50_device_minimum_multiplies_ssrgemm_nt_t_32x64x8_32x32x1_8x4_4 using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -679,9 +679,9 @@ static void BM_SM50_device_minimum_multiplies_ssrgemm_nt_t_32x128x8_32x64x1_8x8_ using WarpShape = cutlass::gemm::GemmShape<32, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -729,9 +729,9 @@ static void BM_SM50_device_minimum_multiplies_ssrgemm_nt_t_64x64x8_64x32x1_8x8_8 using WarpShape = cutlass::gemm::GemmShape<64, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -779,9 +779,9 @@ static void 
BM_SM50_device_minimum_multiplies_ssrgemm_nt_t_32x32x8_16x32x1_4x4_4 using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -829,9 +829,9 @@ static void BM_SM50_device_minimum_multiplies_ssrgemm_nt_t_64x32x8_32x32x1_8x4_4 using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -879,9 +879,9 @@ static void BM_SM50_device_minimum_multiplies_ssrgemm_nt_t_64x64x8_32x64x1_8x8_4 using WarpShape = cutlass::gemm::GemmShape<32, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -929,9 +929,9 @@ static void 
BM_SM50_device_minimum_multiplies_ssrgemm_nt_t_128x32x8_64x32x1_8x8_ using WarpShape = cutlass::gemm::GemmShape<64, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -979,9 +979,9 @@ static void BM_SM50_device_minimum_multiplies_ssrgemm_nt_t_16x32x8_8x16x1_2x2_4x using WarpShape = cutlass::gemm::GemmShape<8, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1029,9 +1029,9 @@ static void BM_SM50_device_minimum_multiplies_ssrgemm_nt_t_16x64x8_8x32x1_2x4_4x using WarpShape = cutlass::gemm::GemmShape<8, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1079,9 +1079,9 @@ static void 
BM_SM50_device_minimum_multiplies_ssrgemm_nt_t_32x32x8_16x16x1_4x2_4 using WarpShape = cutlass::gemm::GemmShape<16, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1129,9 +1129,9 @@ static void BM_SM50_device_minimum_multiplies_ssrgemm_nt_t_32x64x8_16x32x1_4x4_4 using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1179,9 +1179,9 @@ static void BM_SM50_device_minimum_multiplies_ssrgemm_nt_t_32x128x8_16x64x1_4x8_ using WarpShape = cutlass::gemm::GemmShape<16, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1229,9 +1229,9 @@ static void 
BM_SM50_device_minimum_multiplies_ssrgemm_nt_t_64x32x8_32x16x1_4x4_8 using WarpShape = cutlass::gemm::GemmShape<32, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1279,9 +1279,9 @@ static void BM_SM50_device_minimum_multiplies_ssrgemm_nt_t_64x64x8_32x32x1_8x4_4 using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1329,9 +1329,9 @@ static void BM_SM50_device_minimum_multiplies_ssrgemm_nt_t_64x128x8_32x64x1_8x8_ using WarpShape = cutlass::gemm::GemmShape<32, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1379,9 +1379,9 @@ static void 
BM_SM50_device_minimum_multiplies_ssrgemm_nt_t_128x32x8_64x16x1_8x4_ using WarpShape = cutlass::gemm::GemmShape<64, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1429,9 +1429,9 @@ static void BM_SM50_device_minimum_multiplies_ssrgemm_nt_t_128x64x8_64x32x1_8x8_ using WarpShape = cutlass::gemm::GemmShape<64, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1479,9 +1479,9 @@ static void BM_SM50_device_minimum_multiplies_ssrgemm_nt_t_16x64x16_8x16x1_2x2_4 using WarpShape = cutlass::gemm::GemmShape<8, 16, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1529,9 +1529,9 @@ static void 
BM_SM50_device_minimum_multiplies_ssrgemm_nt_t_16x128x16_8x32x1_2x4_ using WarpShape = cutlass::gemm::GemmShape<8, 32, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1579,9 +1579,9 @@ static void BM_SM50_device_minimum_multiplies_ssrgemm_nt_t_32x32x8_16x8x1_2x2_8x using WarpShape = cutlass::gemm::GemmShape<16, 8, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1629,9 +1629,9 @@ static void BM_SM50_device_minimum_multiplies_ssrgemm_nt_t_32x64x8_16x16x1_4x2_4 using WarpShape = cutlass::gemm::GemmShape<16, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1679,9 +1679,9 @@ static void 
BM_SM50_device_minimum_multiplies_ssrgemm_nt_t_32x128x8_16x32x1_4x4_ using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1729,9 +1729,9 @@ static void BM_SM50_device_minimum_multiplies_ssrgemm_nt_t_32x256x8_16x64x1_4x8_ using WarpShape = cutlass::gemm::GemmShape<16, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1779,9 +1779,9 @@ static void BM_SM50_device_minimum_multiplies_ssrgemm_nt_t_64x64x8_32x16x1_4x4_8 using WarpShape = cutlass::gemm::GemmShape<32, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1829,9 +1829,9 @@ static void 
BM_SM50_device_minimum_multiplies_ssrgemm_nt_t_64x128x8_32x32x1_8x4_ using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1879,9 +1879,9 @@ static void BM_SM50_device_minimum_multiplies_ssrgemm_nt_t_64x256x8_32x64x1_8x8_ using WarpShape = cutlass::gemm::GemmShape<32, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1929,9 +1929,9 @@ static void BM_SM50_device_minimum_multiplies_ssrgemm_nt_t_128x128x8_64x32x1_8x8 using WarpShape = cutlass::gemm::GemmShape<64, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1979,9 +1979,9 @@ static void 
BM_SM50_device_minimum_multiplies_ssrgemm_nt_t_32x32x8_8x16x1_2x2_4x using WarpShape = cutlass::gemm::GemmShape<8, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -2029,9 +2029,9 @@ static void BM_SM50_device_minimum_multiplies_ssrgemm_nt_t_64x32x8_16x16x1_4x2_4 using WarpShape = cutlass::gemm::GemmShape<16, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -2079,9 +2079,9 @@ static void BM_SM50_device_minimum_multiplies_ssrgemm_nt_t_64x64x8_16x32x1_4x4_4 using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -2129,9 +2129,9 @@ static void 
BM_SM50_device_minimum_multiplies_ssrgemm_nt_t_128x32x8_32x16x1_4x4_ using WarpShape = cutlass::gemm::GemmShape<32, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -2179,9 +2179,9 @@ static void BM_SM50_device_minimum_multiplies_ssrgemm_nt_t_128x64x8_32x32x1_8x4_ using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -2229,9 +2229,9 @@ static void BM_SM50_device_minimum_multiplies_ssrgemm_nt_t_128x128x8_32x64x1_8x8 using WarpShape = cutlass::gemm::GemmShape<32, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -2279,9 +2279,9 @@ static void 
BM_SM50_device_minimum_multiplies_ssrgemm_nt_t_256x32x8_64x16x1_8x4_ using WarpShape = cutlass::gemm::GemmShape<64, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -2329,9 +2329,9 @@ static void BM_SM50_device_minimum_multiplies_ssrgemm_nt_t_256x64x8_64x32x1_8x8_ using WarpShape = cutlass::gemm::GemmShape<64, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -2379,9 +2379,9 @@ static void BM_SM50_device_minimum_multiplies_ssrgemm_nt_t_32x64x16_8x16x1_2x2_4 using WarpShape = cutlass::gemm::GemmShape<8, 16, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -2429,9 +2429,9 @@ static void 
BM_SM50_device_minimum_multiplies_ssrgemm_nt_t_32x128x16_8x32x1_2x4_ using WarpShape = cutlass::gemm::GemmShape<8, 32, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -2479,9 +2479,9 @@ static void BM_SM50_device_minimum_multiplies_ssrgemm_nt_t_64x32x16_16x8x1_2x2_8 using WarpShape = cutlass::gemm::GemmShape<16, 8, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -2529,9 +2529,9 @@ static void BM_SM50_device_minimum_multiplies_ssrgemm_nt_t_64x64x8_16x16x1_4x2_4 using WarpShape = cutlass::gemm::GemmShape<16, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -2579,9 +2579,9 @@ static void 
BM_SM50_device_minimum_multiplies_ssrgemm_nt_t_64x128x8_16x32x1_4x4_ using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -2629,9 +2629,9 @@ static void BM_SM50_device_minimum_multiplies_ssrgemm_nt_t_64x256x8_16x64x1_4x8_ using WarpShape = cutlass::gemm::GemmShape<16, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -2679,9 +2679,9 @@ static void BM_SM50_device_minimum_multiplies_ssrgemm_nt_t_128x32x16_32x8x1_4x2_ using WarpShape = cutlass::gemm::GemmShape<32, 8, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -2729,9 +2729,9 @@ static void 
BM_SM50_device_minimum_multiplies_ssrgemm_nt_t_128x64x8_32x16x1_4x4_ using WarpShape = cutlass::gemm::GemmShape<32, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -2779,9 +2779,9 @@ static void BM_SM50_device_minimum_multiplies_ssrgemm_nt_t_128x128x8_32x32x1_8x4 using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -2829,9 +2829,9 @@ static void BM_SM50_device_minimum_multiplies_ssrgemm_nt_t_256x64x8_64x16x1_8x4_ using WarpShape = cutlass::gemm::GemmShape<64, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; diff --git 
a/bench/device/sm50_simt_minimum_multiplies_ssrgemm_tn_n.cu b/bench/device/sm50_simt_minimum_multiplies_ssrgemm_tn_n.cu index 04b377b..08457fa 100644 --- a/bench/device/sm50_simt_minimum_multiplies_ssrgemm_tn_n.cu +++ b/bench/device/sm50_simt_minimum_multiplies_ssrgemm_tn_n.cu @@ -29,9 +29,9 @@ static void BM_SM50_device_minimum_multiplies_ssrgemm_tn_n_8x32x8_8x32x1_2x4_4x8 using WarpShape = cutlass::gemm::GemmShape<8, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -79,9 +79,9 @@ static void BM_SM50_device_minimum_multiplies_ssrgemm_tn_n_16x32x8_16x32x1_4x4_4 using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -129,9 +129,9 @@ static void BM_SM50_device_minimum_multiplies_ssrgemm_tn_n_16x64x8_16x64x1_4x8_4 using WarpShape = cutlass::gemm::GemmShape<16, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = 
typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -179,9 +179,9 @@ static void BM_SM50_device_minimum_multiplies_ssrgemm_tn_n_32x32x8_32x32x1_8x4_4 using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -229,9 +229,9 @@ static void BM_SM50_device_minimum_multiplies_ssrgemm_tn_n_32x64x8_32x64x1_8x8_4 using WarpShape = cutlass::gemm::GemmShape<32, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -279,9 +279,9 @@ static void BM_SM50_device_minimum_multiplies_ssrgemm_tn_n_64x32x8_64x32x1_8x8_8 using WarpShape = cutlass::gemm::GemmShape<64, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename 
cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -329,9 +329,9 @@ static void BM_SM50_device_minimum_multiplies_ssrgemm_tn_n_8x32x8_8x16x1_2x2_4x8 using WarpShape = cutlass::gemm::GemmShape<8, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -379,9 +379,9 @@ static void BM_SM50_device_minimum_multiplies_ssrgemm_tn_n_8x64x8_8x32x1_2x4_4x8 using WarpShape = cutlass::gemm::GemmShape<8, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -429,9 +429,9 @@ static void BM_SM50_device_minimum_multiplies_ssrgemm_tn_n_16x32x8_16x16x1_4x2_4 using WarpShape = cutlass::gemm::GemmShape<16, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename 
cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -479,9 +479,9 @@ static void BM_SM50_device_minimum_multiplies_ssrgemm_tn_n_16x64x8_16x32x1_4x4_4 using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -529,9 +529,9 @@ static void BM_SM50_device_minimum_multiplies_ssrgemm_tn_n_16x128x8_16x64x1_4x8_ using WarpShape = cutlass::gemm::GemmShape<16, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -579,9 +579,9 @@ static void BM_SM50_device_minimum_multiplies_ssrgemm_tn_n_32x32x8_32x16x1_4x4_8 using WarpShape = cutlass::gemm::GemmShape<32, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename 
cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -629,9 +629,9 @@ static void BM_SM50_device_minimum_multiplies_ssrgemm_tn_n_32x64x8_32x32x1_8x4_4 using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -679,9 +679,9 @@ static void BM_SM50_device_minimum_multiplies_ssrgemm_tn_n_32x128x8_32x64x1_8x8_ using WarpShape = cutlass::gemm::GemmShape<32, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -729,9 +729,9 @@ static void BM_SM50_device_minimum_multiplies_ssrgemm_tn_n_64x64x8_64x32x1_8x8_8 using WarpShape = cutlass::gemm::GemmShape<64, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename 
cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -779,9 +779,9 @@ static void BM_SM50_device_minimum_multiplies_ssrgemm_tn_n_32x32x8_16x32x1_4x4_4 using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -829,9 +829,9 @@ static void BM_SM50_device_minimum_multiplies_ssrgemm_tn_n_64x32x8_32x32x1_8x4_4 using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -879,9 +879,9 @@ static void BM_SM50_device_minimum_multiplies_ssrgemm_tn_n_64x64x8_32x64x1_8x8_4 using WarpShape = cutlass::gemm::GemmShape<32, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename 
cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -929,9 +929,9 @@ static void BM_SM50_device_minimum_multiplies_ssrgemm_tn_n_128x32x8_64x32x1_8x8_ using WarpShape = cutlass::gemm::GemmShape<64, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -979,9 +979,9 @@ static void BM_SM50_device_minimum_multiplies_ssrgemm_tn_n_16x32x8_8x16x1_2x2_4x using WarpShape = cutlass::gemm::GemmShape<8, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1029,9 +1029,9 @@ static void BM_SM50_device_minimum_multiplies_ssrgemm_tn_n_16x64x8_8x32x1_2x4_4x using WarpShape = cutlass::gemm::GemmShape<8, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename 
cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1079,9 +1079,9 @@ static void BM_SM50_device_minimum_multiplies_ssrgemm_tn_n_32x32x8_16x16x1_4x2_4 using WarpShape = cutlass::gemm::GemmShape<16, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1129,9 +1129,9 @@ static void BM_SM50_device_minimum_multiplies_ssrgemm_tn_n_32x64x8_16x32x1_4x4_4 using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1179,9 +1179,9 @@ static void BM_SM50_device_minimum_multiplies_ssrgemm_tn_n_32x128x8_16x64x1_4x8_ using WarpShape = cutlass::gemm::GemmShape<16, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename 
cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1229,9 +1229,9 @@ static void BM_SM50_device_minimum_multiplies_ssrgemm_tn_n_64x32x8_32x16x1_4x4_8 using WarpShape = cutlass::gemm::GemmShape<32, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1279,9 +1279,9 @@ static void BM_SM50_device_minimum_multiplies_ssrgemm_tn_n_64x64x8_32x32x1_8x4_4 using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1329,9 +1329,9 @@ static void BM_SM50_device_minimum_multiplies_ssrgemm_tn_n_64x128x8_32x64x1_8x8_ using WarpShape = cutlass::gemm::GemmShape<32, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename 
cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1379,9 +1379,9 @@ static void BM_SM50_device_minimum_multiplies_ssrgemm_tn_n_128x32x8_64x16x1_8x4_ using WarpShape = cutlass::gemm::GemmShape<64, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1429,9 +1429,9 @@ static void BM_SM50_device_minimum_multiplies_ssrgemm_tn_n_128x64x8_64x32x1_8x8_ using WarpShape = cutlass::gemm::GemmShape<64, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1479,9 +1479,9 @@ static void BM_SM50_device_minimum_multiplies_ssrgemm_tn_n_16x64x16_8x16x1_2x2_4 using WarpShape = cutlass::gemm::GemmShape<8, 16, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename 
cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1529,9 +1529,9 @@ static void BM_SM50_device_minimum_multiplies_ssrgemm_tn_n_16x128x16_8x32x1_2x4_ using WarpShape = cutlass::gemm::GemmShape<8, 32, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1579,9 +1579,9 @@ static void BM_SM50_device_minimum_multiplies_ssrgemm_tn_n_32x32x8_16x8x1_2x2_8x using WarpShape = cutlass::gemm::GemmShape<16, 8, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1629,9 +1629,9 @@ static void BM_SM50_device_minimum_multiplies_ssrgemm_tn_n_32x64x8_16x16x1_4x2_4 using WarpShape = cutlass::gemm::GemmShape<16, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename 
cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1679,9 +1679,9 @@ static void BM_SM50_device_minimum_multiplies_ssrgemm_tn_n_32x128x8_16x32x1_4x4_ using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1729,9 +1729,9 @@ static void BM_SM50_device_minimum_multiplies_ssrgemm_tn_n_32x256x8_16x64x1_4x8_ using WarpShape = cutlass::gemm::GemmShape<16, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1779,9 +1779,9 @@ static void BM_SM50_device_minimum_multiplies_ssrgemm_tn_n_64x64x8_32x16x1_4x4_8 using WarpShape = cutlass::gemm::GemmShape<32, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename 
cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1829,9 +1829,9 @@ static void BM_SM50_device_minimum_multiplies_ssrgemm_tn_n_64x128x8_32x32x1_8x4_ using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1879,9 +1879,9 @@ static void BM_SM50_device_minimum_multiplies_ssrgemm_tn_n_64x256x8_32x64x1_8x8_ using WarpShape = cutlass::gemm::GemmShape<32, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1929,9 +1929,9 @@ static void BM_SM50_device_minimum_multiplies_ssrgemm_tn_n_128x128x8_64x32x1_8x8 using WarpShape = cutlass::gemm::GemmShape<64, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename 
cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1979,9 +1979,9 @@ static void BM_SM50_device_minimum_multiplies_ssrgemm_tn_n_32x32x8_8x16x1_2x2_4x using WarpShape = cutlass::gemm::GemmShape<8, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -2029,9 +2029,9 @@ static void BM_SM50_device_minimum_multiplies_ssrgemm_tn_n_64x32x8_16x16x1_4x2_4 using WarpShape = cutlass::gemm::GemmShape<16, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -2079,9 +2079,9 @@ static void BM_SM50_device_minimum_multiplies_ssrgemm_tn_n_64x64x8_16x32x1_4x4_4 using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename 
cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -2129,9 +2129,9 @@ static void BM_SM50_device_minimum_multiplies_ssrgemm_tn_n_128x32x8_32x16x1_4x4_ using WarpShape = cutlass::gemm::GemmShape<32, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -2179,9 +2179,9 @@ static void BM_SM50_device_minimum_multiplies_ssrgemm_tn_n_128x64x8_32x32x1_8x4_ using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -2229,9 +2229,9 @@ static void BM_SM50_device_minimum_multiplies_ssrgemm_tn_n_128x128x8_32x64x1_8x8 using WarpShape = cutlass::gemm::GemmShape<32, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename 
cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -2279,9 +2279,9 @@ static void BM_SM50_device_minimum_multiplies_ssrgemm_tn_n_256x32x8_64x16x1_8x4_ using WarpShape = cutlass::gemm::GemmShape<64, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -2329,9 +2329,9 @@ static void BM_SM50_device_minimum_multiplies_ssrgemm_tn_n_256x64x8_64x32x1_8x8_ using WarpShape = cutlass::gemm::GemmShape<64, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -2379,9 +2379,9 @@ static void BM_SM50_device_minimum_multiplies_ssrgemm_tn_n_32x64x16_8x16x1_2x2_4 using WarpShape = cutlass::gemm::GemmShape<8, 16, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename 
cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -2429,9 +2429,9 @@ static void BM_SM50_device_minimum_multiplies_ssrgemm_tn_n_32x128x16_8x32x1_2x4_ using WarpShape = cutlass::gemm::GemmShape<8, 32, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -2479,9 +2479,9 @@ static void BM_SM50_device_minimum_multiplies_ssrgemm_tn_n_64x32x16_16x8x1_2x2_8 using WarpShape = cutlass::gemm::GemmShape<16, 8, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -2529,9 +2529,9 @@ static void BM_SM50_device_minimum_multiplies_ssrgemm_tn_n_64x64x8_16x16x1_4x2_4 using WarpShape = cutlass::gemm::GemmShape<16, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename 
cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -2579,9 +2579,9 @@ static void BM_SM50_device_minimum_multiplies_ssrgemm_tn_n_64x128x8_16x32x1_4x4_ using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -2629,9 +2629,9 @@ static void BM_SM50_device_minimum_multiplies_ssrgemm_tn_n_64x256x8_16x64x1_4x8_ using WarpShape = cutlass::gemm::GemmShape<16, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -2679,9 +2679,9 @@ static void BM_SM50_device_minimum_multiplies_ssrgemm_tn_n_128x32x16_32x8x1_4x2_ using WarpShape = cutlass::gemm::GemmShape<32, 8, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename 
cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -2729,9 +2729,9 @@ static void BM_SM50_device_minimum_multiplies_ssrgemm_tn_n_128x64x8_32x16x1_4x4_ using WarpShape = cutlass::gemm::GemmShape<32, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -2779,9 +2779,9 @@ static void BM_SM50_device_minimum_multiplies_ssrgemm_tn_n_128x128x8_32x32x1_8x4 using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -2829,9 +2829,9 @@ static void BM_SM50_device_minimum_multiplies_ssrgemm_tn_n_256x64x8_64x16x1_8x4_ using WarpShape = cutlass::gemm::GemmShape<64, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename 
cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; diff --git a/bench/device/sm50_simt_minimum_multiplies_ssrgemm_tn_t.cu b/bench/device/sm50_simt_minimum_multiplies_ssrgemm_tn_t.cu index 41700e3..1d7ec5a 100644 --- a/bench/device/sm50_simt_minimum_multiplies_ssrgemm_tn_t.cu +++ b/bench/device/sm50_simt_minimum_multiplies_ssrgemm_tn_t.cu @@ -29,9 +29,9 @@ static void BM_SM50_device_minimum_multiplies_ssrgemm_tn_t_8x32x8_8x32x1_2x4_4x8 using WarpShape = cutlass::gemm::GemmShape<8, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -79,9 +79,9 @@ static void BM_SM50_device_minimum_multiplies_ssrgemm_tn_t_16x32x8_16x32x1_4x4_4 using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -129,9 +129,9 @@ static void BM_SM50_device_minimum_multiplies_ssrgemm_tn_t_16x64x8_16x64x1_4x8_4 using WarpShape = cutlass::gemm::GemmShape<16, 64, 8>; using InstructionShape = 
cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -179,9 +179,9 @@ static void BM_SM50_device_minimum_multiplies_ssrgemm_tn_t_32x32x8_32x32x1_8x4_4 using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -229,9 +229,9 @@ static void BM_SM50_device_minimum_multiplies_ssrgemm_tn_t_32x64x8_32x64x1_8x8_4 using WarpShape = cutlass::gemm::GemmShape<32, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -279,9 +279,9 @@ static void BM_SM50_device_minimum_multiplies_ssrgemm_tn_t_64x32x8_64x32x1_8x8_8 using WarpShape = cutlass::gemm::GemmShape<64, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - 
using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -329,9 +329,9 @@ static void BM_SM50_device_minimum_multiplies_ssrgemm_tn_t_8x32x8_8x16x1_2x2_4x8 using WarpShape = cutlass::gemm::GemmShape<8, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -379,9 +379,9 @@ static void BM_SM50_device_minimum_multiplies_ssrgemm_tn_t_8x64x8_8x32x1_2x4_4x8 using WarpShape = cutlass::gemm::GemmShape<8, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -429,9 +429,9 @@ static void BM_SM50_device_minimum_multiplies_ssrgemm_tn_t_16x32x8_16x16x1_4x2_4 using WarpShape = cutlass::gemm::GemmShape<16, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename 
cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -479,9 +479,9 @@ static void BM_SM50_device_minimum_multiplies_ssrgemm_tn_t_16x64x8_16x32x1_4x4_4 using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -529,9 +529,9 @@ static void BM_SM50_device_minimum_multiplies_ssrgemm_tn_t_16x128x8_16x64x1_4x8_ using WarpShape = cutlass::gemm::GemmShape<16, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -579,9 +579,9 @@ static void BM_SM50_device_minimum_multiplies_ssrgemm_tn_t_32x32x8_32x16x1_4x4_8 using WarpShape = cutlass::gemm::GemmShape<32, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename 
cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -629,9 +629,9 @@ static void BM_SM50_device_minimum_multiplies_ssrgemm_tn_t_32x64x8_32x32x1_8x4_4 using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -679,9 +679,9 @@ static void BM_SM50_device_minimum_multiplies_ssrgemm_tn_t_32x128x8_32x64x1_8x8_ using WarpShape = cutlass::gemm::GemmShape<32, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -729,9 +729,9 @@ static void BM_SM50_device_minimum_multiplies_ssrgemm_tn_t_64x64x8_64x32x1_8x8_8 using WarpShape = cutlass::gemm::GemmShape<64, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename 
cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -779,9 +779,9 @@ static void BM_SM50_device_minimum_multiplies_ssrgemm_tn_t_32x32x8_16x32x1_4x4_4 using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -829,9 +829,9 @@ static void BM_SM50_device_minimum_multiplies_ssrgemm_tn_t_64x32x8_32x32x1_8x4_4 using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -879,9 +879,9 @@ static void BM_SM50_device_minimum_multiplies_ssrgemm_tn_t_64x64x8_32x64x1_8x8_4 using WarpShape = cutlass::gemm::GemmShape<32, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename 
cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -929,9 +929,9 @@ static void BM_SM50_device_minimum_multiplies_ssrgemm_tn_t_128x32x8_64x32x1_8x8_ using WarpShape = cutlass::gemm::GemmShape<64, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -979,9 +979,9 @@ static void BM_SM50_device_minimum_multiplies_ssrgemm_tn_t_16x32x8_8x16x1_2x2_4x using WarpShape = cutlass::gemm::GemmShape<8, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1029,9 +1029,9 @@ static void BM_SM50_device_minimum_multiplies_ssrgemm_tn_t_16x64x8_8x32x1_2x4_4x using WarpShape = cutlass::gemm::GemmShape<8, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename 
cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1079,9 +1079,9 @@ static void BM_SM50_device_minimum_multiplies_ssrgemm_tn_t_32x32x8_16x16x1_4x2_4 using WarpShape = cutlass::gemm::GemmShape<16, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1129,9 +1129,9 @@ static void BM_SM50_device_minimum_multiplies_ssrgemm_tn_t_32x64x8_16x32x1_4x4_4 using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1179,9 +1179,9 @@ static void BM_SM50_device_minimum_multiplies_ssrgemm_tn_t_32x128x8_16x64x1_4x8_ using WarpShape = cutlass::gemm::GemmShape<16, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename 
cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1229,9 +1229,9 @@ static void BM_SM50_device_minimum_multiplies_ssrgemm_tn_t_64x32x8_32x16x1_4x4_8 using WarpShape = cutlass::gemm::GemmShape<32, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1279,9 +1279,9 @@ static void BM_SM50_device_minimum_multiplies_ssrgemm_tn_t_64x64x8_32x32x1_8x4_4 using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1329,9 +1329,9 @@ static void BM_SM50_device_minimum_multiplies_ssrgemm_tn_t_64x128x8_32x64x1_8x8_ using WarpShape = cutlass::gemm::GemmShape<32, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename 
cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1379,9 +1379,9 @@ static void BM_SM50_device_minimum_multiplies_ssrgemm_tn_t_128x32x8_64x16x1_8x4_ using WarpShape = cutlass::gemm::GemmShape<64, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1429,9 +1429,9 @@ static void BM_SM50_device_minimum_multiplies_ssrgemm_tn_t_128x64x8_64x32x1_8x8_ using WarpShape = cutlass::gemm::GemmShape<64, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1479,9 +1479,9 @@ static void BM_SM50_device_minimum_multiplies_ssrgemm_tn_t_16x64x16_8x16x1_2x2_4 using WarpShape = cutlass::gemm::GemmShape<8, 16, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename 
cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1529,9 +1529,9 @@ static void BM_SM50_device_minimum_multiplies_ssrgemm_tn_t_16x128x16_8x32x1_2x4_ using WarpShape = cutlass::gemm::GemmShape<8, 32, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1579,9 +1579,9 @@ static void BM_SM50_device_minimum_multiplies_ssrgemm_tn_t_32x32x8_16x8x1_2x2_8x using WarpShape = cutlass::gemm::GemmShape<16, 8, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1629,9 +1629,9 @@ static void BM_SM50_device_minimum_multiplies_ssrgemm_tn_t_32x64x8_16x16x1_4x2_4 using WarpShape = cutlass::gemm::GemmShape<16, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename 
cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1679,9 +1679,9 @@ static void BM_SM50_device_minimum_multiplies_ssrgemm_tn_t_32x128x8_16x32x1_4x4_ using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1729,9 +1729,9 @@ static void BM_SM50_device_minimum_multiplies_ssrgemm_tn_t_32x256x8_16x64x1_4x8_ using WarpShape = cutlass::gemm::GemmShape<16, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1779,9 +1779,9 @@ static void BM_SM50_device_minimum_multiplies_ssrgemm_tn_t_64x64x8_32x16x1_4x4_8 using WarpShape = cutlass::gemm::GemmShape<32, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename 
cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1829,9 +1829,9 @@ static void BM_SM50_device_minimum_multiplies_ssrgemm_tn_t_64x128x8_32x32x1_8x4_ using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1879,9 +1879,9 @@ static void BM_SM50_device_minimum_multiplies_ssrgemm_tn_t_64x256x8_32x64x1_8x8_ using WarpShape = cutlass::gemm::GemmShape<32, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1929,9 +1929,9 @@ static void BM_SM50_device_minimum_multiplies_ssrgemm_tn_t_128x128x8_64x32x1_8x8 using WarpShape = cutlass::gemm::GemmShape<64, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename 
cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1979,9 +1979,9 @@ static void BM_SM50_device_minimum_multiplies_ssrgemm_tn_t_32x32x8_8x16x1_2x2_4x using WarpShape = cutlass::gemm::GemmShape<8, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -2029,9 +2029,9 @@ static void BM_SM50_device_minimum_multiplies_ssrgemm_tn_t_64x32x8_16x16x1_4x2_4 using WarpShape = cutlass::gemm::GemmShape<16, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -2079,9 +2079,9 @@ static void BM_SM50_device_minimum_multiplies_ssrgemm_tn_t_64x64x8_16x32x1_4x4_4 using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename 
cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -2129,9 +2129,9 @@ static void BM_SM50_device_minimum_multiplies_ssrgemm_tn_t_128x32x8_32x16x1_4x4_ using WarpShape = cutlass::gemm::GemmShape<32, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -2179,9 +2179,9 @@ static void BM_SM50_device_minimum_multiplies_ssrgemm_tn_t_128x64x8_32x32x1_8x4_ using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -2229,9 +2229,9 @@ static void BM_SM50_device_minimum_multiplies_ssrgemm_tn_t_128x128x8_32x64x1_8x8 using WarpShape = cutlass::gemm::GemmShape<32, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename 
cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -2279,9 +2279,9 @@ static void BM_SM50_device_minimum_multiplies_ssrgemm_tn_t_256x32x8_64x16x1_8x4_ using WarpShape = cutlass::gemm::GemmShape<64, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -2329,9 +2329,9 @@ static void BM_SM50_device_minimum_multiplies_ssrgemm_tn_t_256x64x8_64x32x1_8x8_ using WarpShape = cutlass::gemm::GemmShape<64, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -2379,9 +2379,9 @@ static void BM_SM50_device_minimum_multiplies_ssrgemm_tn_t_32x64x16_8x16x1_2x2_4 using WarpShape = cutlass::gemm::GemmShape<8, 16, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename 
cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -2429,9 +2429,9 @@ static void BM_SM50_device_minimum_multiplies_ssrgemm_tn_t_32x128x16_8x32x1_2x4_ using WarpShape = cutlass::gemm::GemmShape<8, 32, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -2479,9 +2479,9 @@ static void BM_SM50_device_minimum_multiplies_ssrgemm_tn_t_64x32x16_16x8x1_2x2_8 using WarpShape = cutlass::gemm::GemmShape<16, 8, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -2529,9 +2529,9 @@ static void BM_SM50_device_minimum_multiplies_ssrgemm_tn_t_64x64x8_16x16x1_4x2_4 using WarpShape = cutlass::gemm::GemmShape<16, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename 
cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -2579,9 +2579,9 @@ static void BM_SM50_device_minimum_multiplies_ssrgemm_tn_t_64x128x8_16x32x1_4x4_ using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -2629,9 +2629,9 @@ static void BM_SM50_device_minimum_multiplies_ssrgemm_tn_t_64x256x8_16x64x1_4x8_ using WarpShape = cutlass::gemm::GemmShape<16, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -2679,9 +2679,9 @@ static void BM_SM50_device_minimum_multiplies_ssrgemm_tn_t_128x32x16_32x8x1_4x2_ using WarpShape = cutlass::gemm::GemmShape<32, 8, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename 
cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -2729,9 +2729,9 @@ static void BM_SM50_device_minimum_multiplies_ssrgemm_tn_t_128x64x8_32x16x1_4x4_ using WarpShape = cutlass::gemm::GemmShape<32, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -2779,9 +2779,9 @@ static void BM_SM50_device_minimum_multiplies_ssrgemm_tn_t_128x128x8_32x32x1_8x4 using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -2829,9 +2829,9 @@ static void BM_SM50_device_minimum_multiplies_ssrgemm_tn_t_256x64x8_64x16x1_8x4_ using WarpShape = cutlass::gemm::GemmShape<64, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename 
cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; diff --git a/bench/device/sm50_simt_minimum_multiplies_ssrgemm_tt_n.cu b/bench/device/sm50_simt_minimum_multiplies_ssrgemm_tt_n.cu index e65807a..2d178cc 100644 --- a/bench/device/sm50_simt_minimum_multiplies_ssrgemm_tt_n.cu +++ b/bench/device/sm50_simt_minimum_multiplies_ssrgemm_tt_n.cu @@ -29,9 +29,9 @@ static void BM_SM50_device_minimum_multiplies_ssrgemm_tt_n_8x32x8_8x32x1_2x4_4x8 using WarpShape = cutlass::gemm::GemmShape<8, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -79,9 +79,9 @@ static void BM_SM50_device_minimum_multiplies_ssrgemm_tt_n_16x32x8_16x32x1_4x4_4 using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = 
Config::MultiplicationOp; @@ -129,9 +129,9 @@ static void BM_SM50_device_minimum_multiplies_ssrgemm_tt_n_16x64x8_16x64x1_4x8_4 using WarpShape = cutlass::gemm::GemmShape<16, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -179,9 +179,9 @@ static void BM_SM50_device_minimum_multiplies_ssrgemm_tt_n_32x32x8_32x32x1_8x4_4 using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -229,9 +229,9 @@ static void BM_SM50_device_minimum_multiplies_ssrgemm_tt_n_32x64x8_32x64x1_8x8_4 using WarpShape = cutlass::gemm::GemmShape<32, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -279,9 
+279,9 @@ static void BM_SM50_device_minimum_multiplies_ssrgemm_tt_n_64x32x8_64x32x1_8x8_8 using WarpShape = cutlass::gemm::GemmShape<64, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -329,9 +329,9 @@ static void BM_SM50_device_minimum_multiplies_ssrgemm_tt_n_8x32x8_8x16x1_2x2_4x8 using WarpShape = cutlass::gemm::GemmShape<8, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -379,9 +379,9 @@ static void BM_SM50_device_minimum_multiplies_ssrgemm_tt_n_8x64x8_8x32x1_2x4_4x8 using WarpShape = cutlass::gemm::GemmShape<8, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -429,9 +429,9 @@ static void 
BM_SM50_device_minimum_multiplies_ssrgemm_tt_n_16x32x8_16x16x1_4x2_4 using WarpShape = cutlass::gemm::GemmShape<16, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -479,9 +479,9 @@ static void BM_SM50_device_minimum_multiplies_ssrgemm_tt_n_16x64x8_16x32x1_4x4_4 using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -529,9 +529,9 @@ static void BM_SM50_device_minimum_multiplies_ssrgemm_tt_n_16x128x8_16x64x1_4x8_ using WarpShape = cutlass::gemm::GemmShape<16, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -579,9 +579,9 @@ static void 
BM_SM50_device_minimum_multiplies_ssrgemm_tt_n_32x32x8_32x16x1_4x4_8 using WarpShape = cutlass::gemm::GemmShape<32, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -629,9 +629,9 @@ static void BM_SM50_device_minimum_multiplies_ssrgemm_tt_n_32x64x8_32x32x1_8x4_4 using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -679,9 +679,9 @@ static void BM_SM50_device_minimum_multiplies_ssrgemm_tt_n_32x128x8_32x64x1_8x8_ using WarpShape = cutlass::gemm::GemmShape<32, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -729,9 +729,9 @@ static void 
BM_SM50_device_minimum_multiplies_ssrgemm_tt_n_64x64x8_64x32x1_8x8_8 using WarpShape = cutlass::gemm::GemmShape<64, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -779,9 +779,9 @@ static void BM_SM50_device_minimum_multiplies_ssrgemm_tt_n_32x32x8_16x32x1_4x4_4 using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -829,9 +829,9 @@ static void BM_SM50_device_minimum_multiplies_ssrgemm_tt_n_64x32x8_32x32x1_8x4_4 using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -879,9 +879,9 @@ static void 
BM_SM50_device_minimum_multiplies_ssrgemm_tt_n_64x64x8_32x64x1_8x8_4 using WarpShape = cutlass::gemm::GemmShape<32, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -929,9 +929,9 @@ static void BM_SM50_device_minimum_multiplies_ssrgemm_tt_n_128x32x8_64x32x1_8x8_ using WarpShape = cutlass::gemm::GemmShape<64, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -979,9 +979,9 @@ static void BM_SM50_device_minimum_multiplies_ssrgemm_tt_n_16x32x8_8x16x1_2x2_4x using WarpShape = cutlass::gemm::GemmShape<8, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1029,9 +1029,9 @@ static void 
BM_SM50_device_minimum_multiplies_ssrgemm_tt_n_16x64x8_8x32x1_2x4_4x using WarpShape = cutlass::gemm::GemmShape<8, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1079,9 +1079,9 @@ static void BM_SM50_device_minimum_multiplies_ssrgemm_tt_n_32x32x8_16x16x1_4x2_4 using WarpShape = cutlass::gemm::GemmShape<16, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1129,9 +1129,9 @@ static void BM_SM50_device_minimum_multiplies_ssrgemm_tt_n_32x64x8_16x32x1_4x4_4 using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1179,9 +1179,9 @@ static void 
BM_SM50_device_minimum_multiplies_ssrgemm_tt_n_32x128x8_16x64x1_4x8_ using WarpShape = cutlass::gemm::GemmShape<16, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1229,9 +1229,9 @@ static void BM_SM50_device_minimum_multiplies_ssrgemm_tt_n_64x32x8_32x16x1_4x4_8 using WarpShape = cutlass::gemm::GemmShape<32, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1279,9 +1279,9 @@ static void BM_SM50_device_minimum_multiplies_ssrgemm_tt_n_64x64x8_32x32x1_8x4_4 using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1329,9 +1329,9 @@ static void 
BM_SM50_device_minimum_multiplies_ssrgemm_tt_n_64x128x8_32x64x1_8x8_ using WarpShape = cutlass::gemm::GemmShape<32, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1379,9 +1379,9 @@ static void BM_SM50_device_minimum_multiplies_ssrgemm_tt_n_128x32x8_64x16x1_8x4_ using WarpShape = cutlass::gemm::GemmShape<64, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1429,9 +1429,9 @@ static void BM_SM50_device_minimum_multiplies_ssrgemm_tt_n_128x64x8_64x32x1_8x8_ using WarpShape = cutlass::gemm::GemmShape<64, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1479,9 +1479,9 @@ static void 
BM_SM50_device_minimum_multiplies_ssrgemm_tt_n_16x64x16_8x16x1_2x2_4 using WarpShape = cutlass::gemm::GemmShape<8, 16, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1529,9 +1529,9 @@ static void BM_SM50_device_minimum_multiplies_ssrgemm_tt_n_16x128x16_8x32x1_2x4_ using WarpShape = cutlass::gemm::GemmShape<8, 32, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1579,9 +1579,9 @@ static void BM_SM50_device_minimum_multiplies_ssrgemm_tt_n_32x32x8_16x8x1_2x2_8x using WarpShape = cutlass::gemm::GemmShape<16, 8, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1629,9 +1629,9 @@ static void 
BM_SM50_device_minimum_multiplies_ssrgemm_tt_n_32x64x8_16x16x1_4x2_4 using WarpShape = cutlass::gemm::GemmShape<16, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1679,9 +1679,9 @@ static void BM_SM50_device_minimum_multiplies_ssrgemm_tt_n_32x128x8_16x32x1_4x4_ using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1729,9 +1729,9 @@ static void BM_SM50_device_minimum_multiplies_ssrgemm_tt_n_32x256x8_16x64x1_4x8_ using WarpShape = cutlass::gemm::GemmShape<16, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1779,9 +1779,9 @@ static void 
BM_SM50_device_minimum_multiplies_ssrgemm_tt_n_64x64x8_32x16x1_4x4_8 using WarpShape = cutlass::gemm::GemmShape<32, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1829,9 +1829,9 @@ static void BM_SM50_device_minimum_multiplies_ssrgemm_tt_n_64x128x8_32x32x1_8x4_ using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1879,9 +1879,9 @@ static void BM_SM50_device_minimum_multiplies_ssrgemm_tt_n_64x256x8_32x64x1_8x8_ using WarpShape = cutlass::gemm::GemmShape<32, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1929,9 +1929,9 @@ static void 
BM_SM50_device_minimum_multiplies_ssrgemm_tt_n_128x128x8_64x32x1_8x8 using WarpShape = cutlass::gemm::GemmShape<64, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1979,9 +1979,9 @@ static void BM_SM50_device_minimum_multiplies_ssrgemm_tt_n_32x32x8_8x16x1_2x2_4x using WarpShape = cutlass::gemm::GemmShape<8, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -2029,9 +2029,9 @@ static void BM_SM50_device_minimum_multiplies_ssrgemm_tt_n_64x32x8_16x16x1_4x2_4 using WarpShape = cutlass::gemm::GemmShape<16, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -2079,9 +2079,9 @@ static void 
BM_SM50_device_minimum_multiplies_ssrgemm_tt_n_64x64x8_16x32x1_4x4_4 using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -2129,9 +2129,9 @@ static void BM_SM50_device_minimum_multiplies_ssrgemm_tt_n_128x32x8_32x16x1_4x4_ using WarpShape = cutlass::gemm::GemmShape<32, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -2179,9 +2179,9 @@ static void BM_SM50_device_minimum_multiplies_ssrgemm_tt_n_128x64x8_32x32x1_8x4_ using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -2229,9 +2229,9 @@ static void 
BM_SM50_device_minimum_multiplies_ssrgemm_tt_n_128x128x8_32x64x1_8x8 using WarpShape = cutlass::gemm::GemmShape<32, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -2279,9 +2279,9 @@ static void BM_SM50_device_minimum_multiplies_ssrgemm_tt_n_256x32x8_64x16x1_8x4_ using WarpShape = cutlass::gemm::GemmShape<64, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -2329,9 +2329,9 @@ static void BM_SM50_device_minimum_multiplies_ssrgemm_tt_n_256x64x8_64x32x1_8x8_ using WarpShape = cutlass::gemm::GemmShape<64, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -2379,9 +2379,9 @@ static void 
BM_SM50_device_minimum_multiplies_ssrgemm_tt_n_32x64x16_8x16x1_2x2_4 using WarpShape = cutlass::gemm::GemmShape<8, 16, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -2429,9 +2429,9 @@ static void BM_SM50_device_minimum_multiplies_ssrgemm_tt_n_32x128x16_8x32x1_2x4_ using WarpShape = cutlass::gemm::GemmShape<8, 32, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -2479,9 +2479,9 @@ static void BM_SM50_device_minimum_multiplies_ssrgemm_tt_n_64x32x16_16x8x1_2x2_8 using WarpShape = cutlass::gemm::GemmShape<16, 8, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -2529,9 +2529,9 @@ static void 
BM_SM50_device_minimum_multiplies_ssrgemm_tt_n_64x64x8_16x16x1_4x2_4 using WarpShape = cutlass::gemm::GemmShape<16, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -2579,9 +2579,9 @@ static void BM_SM50_device_minimum_multiplies_ssrgemm_tt_n_64x128x8_16x32x1_4x4_ using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -2629,9 +2629,9 @@ static void BM_SM50_device_minimum_multiplies_ssrgemm_tt_n_64x256x8_16x64x1_4x8_ using WarpShape = cutlass::gemm::GemmShape<16, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -2679,9 +2679,9 @@ static void 
BM_SM50_device_minimum_multiplies_ssrgemm_tt_n_128x32x16_32x8x1_4x2_ using WarpShape = cutlass::gemm::GemmShape<32, 8, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -2729,9 +2729,9 @@ static void BM_SM50_device_minimum_multiplies_ssrgemm_tt_n_128x64x8_32x16x1_4x4_ using WarpShape = cutlass::gemm::GemmShape<32, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -2779,9 +2779,9 @@ static void BM_SM50_device_minimum_multiplies_ssrgemm_tt_n_128x128x8_32x32x1_8x4 using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -2829,9 +2829,9 @@ static void 
BM_SM50_device_minimum_multiplies_ssrgemm_tt_n_256x64x8_64x16x1_8x4_ using WarpShape = cutlass::gemm::GemmShape<64, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; diff --git a/bench/device/sm50_simt_minimum_multiplies_ssrgemm_tt_t.cu b/bench/device/sm50_simt_minimum_multiplies_ssrgemm_tt_t.cu index b23ec39..dd8150d 100644 --- a/bench/device/sm50_simt_minimum_multiplies_ssrgemm_tt_t.cu +++ b/bench/device/sm50_simt_minimum_multiplies_ssrgemm_tt_t.cu @@ -29,9 +29,9 @@ static void BM_SM50_device_minimum_multiplies_ssrgemm_tt_t_8x32x8_8x32x1_2x4_4x8 using WarpShape = cutlass::gemm::GemmShape<8, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -79,9 +79,9 @@ static void BM_SM50_device_minimum_multiplies_ssrgemm_tt_t_16x32x8_16x32x1_4x4_4 using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename 
cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -129,9 +129,9 @@ static void BM_SM50_device_minimum_multiplies_ssrgemm_tt_t_16x64x8_16x64x1_4x8_4 using WarpShape = cutlass::gemm::GemmShape<16, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -179,9 +179,9 @@ static void BM_SM50_device_minimum_multiplies_ssrgemm_tt_t_32x32x8_32x32x1_8x4_4 using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -229,9 +229,9 @@ static void BM_SM50_device_minimum_multiplies_ssrgemm_tt_t_32x64x8_32x64x1_8x8_4 using WarpShape = cutlass::gemm::GemmShape<32, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename 
cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -279,9 +279,9 @@ static void BM_SM50_device_minimum_multiplies_ssrgemm_tt_t_64x32x8_64x32x1_8x8_8 using WarpShape = cutlass::gemm::GemmShape<64, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -329,9 +329,9 @@ static void BM_SM50_device_minimum_multiplies_ssrgemm_tt_t_8x32x8_8x16x1_2x2_4x8 using WarpShape = cutlass::gemm::GemmShape<8, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -379,9 +379,9 @@ static void BM_SM50_device_minimum_multiplies_ssrgemm_tt_t_8x64x8_8x32x1_2x4_4x8 using WarpShape = cutlass::gemm::GemmShape<8, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename 
cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -429,9 +429,9 @@ static void BM_SM50_device_minimum_multiplies_ssrgemm_tt_t_16x32x8_16x16x1_4x2_4 using WarpShape = cutlass::gemm::GemmShape<16, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -479,9 +479,9 @@ static void BM_SM50_device_minimum_multiplies_ssrgemm_tt_t_16x64x8_16x32x1_4x4_4 using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -529,9 +529,9 @@ static void BM_SM50_device_minimum_multiplies_ssrgemm_tt_t_16x128x8_16x64x1_4x8_ using WarpShape = cutlass::gemm::GemmShape<16, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename 
cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -579,9 +579,9 @@ static void BM_SM50_device_minimum_multiplies_ssrgemm_tt_t_32x32x8_32x16x1_4x4_8 using WarpShape = cutlass::gemm::GemmShape<32, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -629,9 +629,9 @@ static void BM_SM50_device_minimum_multiplies_ssrgemm_tt_t_32x64x8_32x32x1_8x4_4 using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -679,9 +679,9 @@ static void BM_SM50_device_minimum_multiplies_ssrgemm_tt_t_32x128x8_32x64x1_8x8_ using WarpShape = cutlass::gemm::GemmShape<32, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename 
cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -729,9 +729,9 @@ static void BM_SM50_device_minimum_multiplies_ssrgemm_tt_t_64x64x8_64x32x1_8x8_8 using WarpShape = cutlass::gemm::GemmShape<64, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -779,9 +779,9 @@ static void BM_SM50_device_minimum_multiplies_ssrgemm_tt_t_32x32x8_16x32x1_4x4_4 using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -829,9 +829,9 @@ static void BM_SM50_device_minimum_multiplies_ssrgemm_tt_t_64x32x8_32x32x1_8x4_4 using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename 
cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -879,9 +879,9 @@ static void BM_SM50_device_minimum_multiplies_ssrgemm_tt_t_64x64x8_32x64x1_8x8_4 using WarpShape = cutlass::gemm::GemmShape<32, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -929,9 +929,9 @@ static void BM_SM50_device_minimum_multiplies_ssrgemm_tt_t_128x32x8_64x32x1_8x8_ using WarpShape = cutlass::gemm::GemmShape<64, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -979,9 +979,9 @@ static void BM_SM50_device_minimum_multiplies_ssrgemm_tt_t_16x32x8_8x16x1_2x2_4x using WarpShape = cutlass::gemm::GemmShape<8, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename 
cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1029,9 +1029,9 @@ static void BM_SM50_device_minimum_multiplies_ssrgemm_tt_t_16x64x8_8x32x1_2x4_4x using WarpShape = cutlass::gemm::GemmShape<8, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1079,9 +1079,9 @@ static void BM_SM50_device_minimum_multiplies_ssrgemm_tt_t_32x32x8_16x16x1_4x2_4 using WarpShape = cutlass::gemm::GemmShape<16, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1129,9 +1129,9 @@ static void BM_SM50_device_minimum_multiplies_ssrgemm_tt_t_32x64x8_16x32x1_4x4_4 using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename 
cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1179,9 +1179,9 @@ static void BM_SM50_device_minimum_multiplies_ssrgemm_tt_t_32x128x8_16x64x1_4x8_ using WarpShape = cutlass::gemm::GemmShape<16, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1229,9 +1229,9 @@ static void BM_SM50_device_minimum_multiplies_ssrgemm_tt_t_64x32x8_32x16x1_4x4_8 using WarpShape = cutlass::gemm::GemmShape<32, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1279,9 +1279,9 @@ static void BM_SM50_device_minimum_multiplies_ssrgemm_tt_t_64x64x8_32x32x1_8x4_4 using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename 
cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1329,9 +1329,9 @@ static void BM_SM50_device_minimum_multiplies_ssrgemm_tt_t_64x128x8_32x64x1_8x8_ using WarpShape = cutlass::gemm::GemmShape<32, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1379,9 +1379,9 @@ static void BM_SM50_device_minimum_multiplies_ssrgemm_tt_t_128x32x8_64x16x1_8x4_ using WarpShape = cutlass::gemm::GemmShape<64, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1429,9 +1429,9 @@ static void BM_SM50_device_minimum_multiplies_ssrgemm_tt_t_128x64x8_64x32x1_8x8_ using WarpShape = cutlass::gemm::GemmShape<64, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename 
cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1479,9 +1479,9 @@ static void BM_SM50_device_minimum_multiplies_ssrgemm_tt_t_16x64x16_8x16x1_2x2_4 using WarpShape = cutlass::gemm::GemmShape<8, 16, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1529,9 +1529,9 @@ static void BM_SM50_device_minimum_multiplies_ssrgemm_tt_t_16x128x16_8x32x1_2x4_ using WarpShape = cutlass::gemm::GemmShape<8, 32, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1579,9 +1579,9 @@ static void BM_SM50_device_minimum_multiplies_ssrgemm_tt_t_32x32x8_16x8x1_2x2_8x using WarpShape = cutlass::gemm::GemmShape<16, 8, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename 
cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1629,9 +1629,9 @@ static void BM_SM50_device_minimum_multiplies_ssrgemm_tt_t_32x64x8_16x16x1_4x2_4 using WarpShape = cutlass::gemm::GemmShape<16, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1679,9 +1679,9 @@ static void BM_SM50_device_minimum_multiplies_ssrgemm_tt_t_32x128x8_16x32x1_4x4_ using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1729,9 +1729,9 @@ static void BM_SM50_device_minimum_multiplies_ssrgemm_tt_t_32x256x8_16x64x1_4x8_ using WarpShape = cutlass::gemm::GemmShape<16, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename 
cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1779,9 +1779,9 @@ static void BM_SM50_device_minimum_multiplies_ssrgemm_tt_t_64x64x8_32x16x1_4x4_8 using WarpShape = cutlass::gemm::GemmShape<32, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1829,9 +1829,9 @@ static void BM_SM50_device_minimum_multiplies_ssrgemm_tt_t_64x128x8_32x32x1_8x4_ using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1879,9 +1879,9 @@ static void BM_SM50_device_minimum_multiplies_ssrgemm_tt_t_64x256x8_32x64x1_8x8_ using WarpShape = cutlass::gemm::GemmShape<32, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename 
cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1929,9 +1929,9 @@ static void BM_SM50_device_minimum_multiplies_ssrgemm_tt_t_128x128x8_64x32x1_8x8 using WarpShape = cutlass::gemm::GemmShape<64, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1979,9 +1979,9 @@ static void BM_SM50_device_minimum_multiplies_ssrgemm_tt_t_32x32x8_8x16x1_2x2_4x using WarpShape = cutlass::gemm::GemmShape<8, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -2029,9 +2029,9 @@ static void BM_SM50_device_minimum_multiplies_ssrgemm_tt_t_64x32x8_16x16x1_4x2_4 using WarpShape = cutlass::gemm::GemmShape<16, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename 
cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -2079,9 +2079,9 @@ static void BM_SM50_device_minimum_multiplies_ssrgemm_tt_t_64x64x8_16x32x1_4x4_4 using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -2129,9 +2129,9 @@ static void BM_SM50_device_minimum_multiplies_ssrgemm_tt_t_128x32x8_32x16x1_4x4_ using WarpShape = cutlass::gemm::GemmShape<32, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -2179,9 +2179,9 @@ static void BM_SM50_device_minimum_multiplies_ssrgemm_tt_t_128x64x8_32x32x1_8x4_ using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename 
cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -2229,9 +2229,9 @@ static void BM_SM50_device_minimum_multiplies_ssrgemm_tt_t_128x128x8_32x64x1_8x8 using WarpShape = cutlass::gemm::GemmShape<32, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -2279,9 +2279,9 @@ static void BM_SM50_device_minimum_multiplies_ssrgemm_tt_t_256x32x8_64x16x1_8x4_ using WarpShape = cutlass::gemm::GemmShape<64, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -2329,9 +2329,9 @@ static void BM_SM50_device_minimum_multiplies_ssrgemm_tt_t_256x64x8_64x32x1_8x8_ using WarpShape = cutlass::gemm::GemmShape<64, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename 
cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -2379,9 +2379,9 @@ static void BM_SM50_device_minimum_multiplies_ssrgemm_tt_t_32x64x16_8x16x1_2x2_4 using WarpShape = cutlass::gemm::GemmShape<8, 16, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -2429,9 +2429,9 @@ static void BM_SM50_device_minimum_multiplies_ssrgemm_tt_t_32x128x16_8x32x1_2x4_ using WarpShape = cutlass::gemm::GemmShape<8, 32, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -2479,9 +2479,9 @@ static void BM_SM50_device_minimum_multiplies_ssrgemm_tt_t_64x32x16_16x8x1_2x2_8 using WarpShape = cutlass::gemm::GemmShape<16, 8, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename 
cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -2529,9 +2529,9 @@ static void BM_SM50_device_minimum_multiplies_ssrgemm_tt_t_64x64x8_16x16x1_4x2_4 using WarpShape = cutlass::gemm::GemmShape<16, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -2579,9 +2579,9 @@ static void BM_SM50_device_minimum_multiplies_ssrgemm_tt_t_64x128x8_16x32x1_4x4_ using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -2629,9 +2629,9 @@ static void BM_SM50_device_minimum_multiplies_ssrgemm_tt_t_64x256x8_16x64x1_4x8_ using WarpShape = cutlass::gemm::GemmShape<16, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename 
cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -2679,9 +2679,9 @@ static void BM_SM50_device_minimum_multiplies_ssrgemm_tt_t_128x32x16_32x8x1_4x2_ using WarpShape = cutlass::gemm::GemmShape<32, 8, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -2729,9 +2729,9 @@ static void BM_SM50_device_minimum_multiplies_ssrgemm_tt_t_128x64x8_32x16x1_4x4_ using WarpShape = cutlass::gemm::GemmShape<32, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -2779,9 +2779,9 @@ static void BM_SM50_device_minimum_multiplies_ssrgemm_tt_t_128x128x8_32x32x1_8x4 using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename 
cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -2829,9 +2829,9 @@ static void BM_SM50_device_minimum_multiplies_ssrgemm_tt_t_256x64x8_64x16x1_8x4_ using WarpShape = cutlass::gemm::GemmShape<64, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; diff --git a/bench/device/sm50_simt_minimum_plus_dsrgemm_nn_n.cu b/bench/device/sm50_simt_minimum_plus_dsrgemm_nn_n.cu index 4a89a3a..f5f7131 100644 --- a/bench/device/sm50_simt_minimum_plus_dsrgemm_nn_n.cu +++ b/bench/device/sm50_simt_minimum_plus_dsrgemm_nn_n.cu @@ -29,9 +29,9 @@ static void BM_SM50_device_minimum_plus_dsrgemm_nn_n_8x32x8_8x32x1_2x4_4x8_1x1(b using WarpShape = cutlass::gemm::GemmShape<8, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -79,9 +79,9 @@ static void BM_SM50_device_minimum_plus_dsrgemm_nn_n_16x32x8_16x32x1_4x4_4x8_1x1 using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; 
- using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -129,9 +129,9 @@ static void BM_SM50_device_minimum_plus_dsrgemm_nn_n_16x64x8_16x64x1_4x8_4x8_1x1 using WarpShape = cutlass::gemm::GemmShape<16, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -179,9 +179,9 @@ static void BM_SM50_device_minimum_plus_dsrgemm_nn_n_32x32x8_32x32x1_8x4_4x8_1x1 using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -229,9 +229,9 @@ static void BM_SM50_device_minimum_plus_dsrgemm_nn_n_8x32x8_8x16x1_2x2_4x8_1x2(b using WarpShape = cutlass::gemm::GemmShape<8, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< 
// - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -279,9 +279,9 @@ static void BM_SM50_device_minimum_plus_dsrgemm_nn_n_8x64x8_8x32x1_2x4_4x8_1x2(b using WarpShape = cutlass::gemm::GemmShape<8, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -329,9 +329,9 @@ static void BM_SM50_device_minimum_plus_dsrgemm_nn_n_16x32x8_16x16x1_4x2_4x8_1x2 using WarpShape = cutlass::gemm::GemmShape<16, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -379,9 +379,9 @@ static void BM_SM50_device_minimum_plus_dsrgemm_nn_n_16x64x8_16x32x1_4x4_4x8_1x2 using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - 
cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -429,9 +429,9 @@ static void BM_SM50_device_minimum_plus_dsrgemm_nn_n_16x128x8_16x64x1_4x8_4x8_1x using WarpShape = cutlass::gemm::GemmShape<16, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -479,9 +479,9 @@ static void BM_SM50_device_minimum_plus_dsrgemm_nn_n_32x32x8_32x16x1_4x4_8x4_1x2 using WarpShape = cutlass::gemm::GemmShape<32, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -529,9 +529,9 @@ static void BM_SM50_device_minimum_plus_dsrgemm_nn_n_32x64x8_32x32x1_8x4_4x8_1x2 using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename 
cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -579,9 +579,9 @@ static void BM_SM50_device_minimum_plus_dsrgemm_nn_n_32x32x8_16x32x1_4x4_4x8_2x1 using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -629,9 +629,9 @@ static void BM_SM50_device_minimum_plus_dsrgemm_nn_n_64x32x8_32x32x1_8x4_4x8_2x1 using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -679,9 +679,9 @@ static void BM_SM50_device_minimum_plus_dsrgemm_nn_n_16x32x8_8x16x1_2x2_4x8_2x2( using WarpShape = cutlass::gemm::GemmShape<8, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, 
precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -729,9 +729,9 @@ static void BM_SM50_device_minimum_plus_dsrgemm_nn_n_16x64x8_8x32x1_2x4_4x8_2x2( using WarpShape = cutlass::gemm::GemmShape<8, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -779,9 +779,9 @@ static void BM_SM50_device_minimum_plus_dsrgemm_nn_n_32x32x8_16x16x1_4x2_4x8_2x2 using WarpShape = cutlass::gemm::GemmShape<16, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -829,9 +829,9 @@ static void BM_SM50_device_minimum_plus_dsrgemm_nn_n_32x64x8_16x32x1_4x4_4x8_2x2 using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using 
AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -879,9 +879,9 @@ static void BM_SM50_device_minimum_plus_dsrgemm_nn_n_32x128x8_16x64x1_4x8_4x8_2x using WarpShape = cutlass::gemm::GemmShape<16, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -929,9 +929,9 @@ static void BM_SM50_device_minimum_plus_dsrgemm_nn_n_64x32x8_32x16x1_4x4_8x4_2x2 using WarpShape = cutlass::gemm::GemmShape<32, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -979,9 +979,9 @@ static void BM_SM50_device_minimum_plus_dsrgemm_nn_n_64x64x8_32x32x1_8x4_4x8_2x2 using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ 
-1029,9 +1029,9 @@ static void BM_SM50_device_minimum_plus_dsrgemm_nn_n_128x32x8_64x16x1_8x4_8x4_2x using WarpShape = cutlass::gemm::GemmShape<64, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1079,9 +1079,9 @@ static void BM_SM50_device_minimum_plus_dsrgemm_nn_n_16x64x16_8x16x1_2x2_4x8_2x4 using WarpShape = cutlass::gemm::GemmShape<8, 16, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1129,9 +1129,9 @@ static void BM_SM50_device_minimum_plus_dsrgemm_nn_n_16x128x16_8x32x1_2x4_4x8_2x using WarpShape = cutlass::gemm::GemmShape<8, 32, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1179,9 +1179,9 @@ static void 
BM_SM50_device_minimum_plus_dsrgemm_nn_n_32x32x8_16x8x1_2x2_8x4_2x4( using WarpShape = cutlass::gemm::GemmShape<16, 8, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1229,9 +1229,9 @@ static void BM_SM50_device_minimum_plus_dsrgemm_nn_n_32x64x8_16x16x1_4x2_4x8_2x4 using WarpShape = cutlass::gemm::GemmShape<16, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1279,9 +1279,9 @@ static void BM_SM50_device_minimum_plus_dsrgemm_nn_n_32x128x8_16x32x1_4x4_4x8_2x using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1329,9 +1329,9 @@ static void BM_SM50_device_minimum_plus_dsrgemm_nn_n_64x64x8_32x16x1_4x4_8x4_2x4 
using WarpShape = cutlass::gemm::GemmShape<32, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1379,9 +1379,9 @@ static void BM_SM50_device_minimum_plus_dsrgemm_nn_n_32x32x8_8x16x1_2x2_4x8_4x2( using WarpShape = cutlass::gemm::GemmShape<8, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1429,9 +1429,9 @@ static void BM_SM50_device_minimum_plus_dsrgemm_nn_n_64x32x8_16x16x1_4x2_4x8_4x2 using WarpShape = cutlass::gemm::GemmShape<16, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1479,9 +1479,9 @@ static void BM_SM50_device_minimum_plus_dsrgemm_nn_n_64x64x8_16x32x1_4x4_4x8_4x2 using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using 
InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1529,9 +1529,9 @@ static void BM_SM50_device_minimum_plus_dsrgemm_nn_n_128x32x8_32x16x1_4x4_8x4_4x using WarpShape = cutlass::gemm::GemmShape<32, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1579,9 +1579,9 @@ static void BM_SM50_device_minimum_plus_dsrgemm_nn_n_32x64x16_8x16x1_2x2_4x8_4x4 using WarpShape = cutlass::gemm::GemmShape<8, 16, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1629,9 +1629,9 @@ static void BM_SM50_device_minimum_plus_dsrgemm_nn_n_32x128x16_8x32x1_2x4_4x8_4x using WarpShape = cutlass::gemm::GemmShape<8, 32, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = 
typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1679,9 +1679,9 @@ static void BM_SM50_device_minimum_plus_dsrgemm_nn_n_64x32x16_16x8x1_2x2_8x4_4x4 using WarpShape = cutlass::gemm::GemmShape<16, 8, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1729,9 +1729,9 @@ static void BM_SM50_device_minimum_plus_dsrgemm_nn_n_64x64x8_16x16x1_4x2_4x8_4x4 using WarpShape = cutlass::gemm::GemmShape<16, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1779,9 +1779,9 @@ static void BM_SM50_device_minimum_plus_dsrgemm_nn_n_128x32x16_32x8x1_4x2_8x4_4x using WarpShape = cutlass::gemm::GemmShape<32, 8, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - 
precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; diff --git a/bench/device/sm50_simt_minimum_plus_dsrgemm_nn_t.cu b/bench/device/sm50_simt_minimum_plus_dsrgemm_nn_t.cu index 36a8691..3b63d71 100644 --- a/bench/device/sm50_simt_minimum_plus_dsrgemm_nn_t.cu +++ b/bench/device/sm50_simt_minimum_plus_dsrgemm_nn_t.cu @@ -29,9 +29,9 @@ static void BM_SM50_device_minimum_plus_dsrgemm_nn_t_8x32x8_8x32x1_2x4_4x8_1x1(b using WarpShape = cutlass::gemm::GemmShape<8, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -79,9 +79,9 @@ static void BM_SM50_device_minimum_plus_dsrgemm_nn_t_16x32x8_16x32x1_4x4_4x8_1x1 using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -129,9 +129,9 @@ static void BM_SM50_device_minimum_plus_dsrgemm_nn_t_16x64x8_16x64x1_4x8_4x8_1x1 using 
WarpShape = cutlass::gemm::GemmShape<16, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -179,9 +179,9 @@ static void BM_SM50_device_minimum_plus_dsrgemm_nn_t_32x32x8_32x32x1_8x4_4x8_1x1 using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -229,9 +229,9 @@ static void BM_SM50_device_minimum_plus_dsrgemm_nn_t_8x32x8_8x16x1_2x2_4x8_1x2(b using WarpShape = cutlass::gemm::GemmShape<8, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -279,9 +279,9 @@ static void BM_SM50_device_minimum_plus_dsrgemm_nn_t_8x64x8_8x32x1_2x4_4x8_1x2(b using WarpShape = cutlass::gemm::GemmShape<8, 32, 8>; using InstructionShape = 
cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -329,9 +329,9 @@ static void BM_SM50_device_minimum_plus_dsrgemm_nn_t_16x32x8_16x16x1_4x2_4x8_1x2 using WarpShape = cutlass::gemm::GemmShape<16, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -379,9 +379,9 @@ static void BM_SM50_device_minimum_plus_dsrgemm_nn_t_16x64x8_16x32x1_4x4_4x8_1x2 using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -429,9 +429,9 @@ static void BM_SM50_device_minimum_plus_dsrgemm_nn_t_16x128x8_16x64x1_4x8_4x8_1x using WarpShape = cutlass::gemm::GemmShape<16, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename 
cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -479,9 +479,9 @@ static void BM_SM50_device_minimum_plus_dsrgemm_nn_t_32x32x8_32x16x1_4x4_8x4_1x2 using WarpShape = cutlass::gemm::GemmShape<32, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -529,9 +529,9 @@ static void BM_SM50_device_minimum_plus_dsrgemm_nn_t_32x64x8_32x32x1_8x4_4x8_1x2 using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -579,9 +579,9 @@ static void BM_SM50_device_minimum_plus_dsrgemm_nn_t_32x32x8_16x32x1_4x4_4x8_2x1 using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, 
precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -629,9 +629,9 @@ static void BM_SM50_device_minimum_plus_dsrgemm_nn_t_64x32x8_32x32x1_8x4_4x8_2x1 using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -679,9 +679,9 @@ static void BM_SM50_device_minimum_plus_dsrgemm_nn_t_16x32x8_8x16x1_2x2_4x8_2x2( using WarpShape = cutlass::gemm::GemmShape<8, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -729,9 +729,9 @@ static void BM_SM50_device_minimum_plus_dsrgemm_nn_t_16x64x8_8x32x1_2x4_4x8_2x2( using WarpShape = cutlass::gemm::GemmShape<8, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, 
SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -779,9 +779,9 @@ static void BM_SM50_device_minimum_plus_dsrgemm_nn_t_32x32x8_16x16x1_4x2_4x8_2x2 using WarpShape = cutlass::gemm::GemmShape<16, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -829,9 +829,9 @@ static void BM_SM50_device_minimum_plus_dsrgemm_nn_t_32x64x8_16x32x1_4x4_4x8_2x2 using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -879,9 +879,9 @@ static void BM_SM50_device_minimum_plus_dsrgemm_nn_t_32x128x8_16x64x1_4x8_4x8_2x using WarpShape = cutlass::gemm::GemmShape<16, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename 
cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -929,9 +929,9 @@ static void BM_SM50_device_minimum_plus_dsrgemm_nn_t_64x32x8_32x16x1_4x4_8x4_2x2 using WarpShape = cutlass::gemm::GemmShape<32, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -979,9 +979,9 @@ static void BM_SM50_device_minimum_plus_dsrgemm_nn_t_64x64x8_32x32x1_8x4_4x8_2x2 using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1029,9 +1029,9 @@ static void BM_SM50_device_minimum_plus_dsrgemm_nn_t_128x32x8_64x16x1_8x4_8x4_2x using WarpShape = cutlass::gemm::GemmShape<64, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, 
precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1079,9 +1079,9 @@ static void BM_SM50_device_minimum_plus_dsrgemm_nn_t_16x64x16_8x16x1_2x2_4x8_2x4 using WarpShape = cutlass::gemm::GemmShape<8, 16, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1129,9 +1129,9 @@ static void BM_SM50_device_minimum_plus_dsrgemm_nn_t_16x128x16_8x32x1_2x4_4x8_2x using WarpShape = cutlass::gemm::GemmShape<8, 32, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1179,9 +1179,9 @@ static void BM_SM50_device_minimum_plus_dsrgemm_nn_t_32x32x8_16x8x1_2x2_8x4_2x4( using WarpShape = cutlass::gemm::GemmShape<16, 8, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; 
using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1229,9 +1229,9 @@ static void BM_SM50_device_minimum_plus_dsrgemm_nn_t_32x64x8_16x16x1_4x2_4x8_2x4 using WarpShape = cutlass::gemm::GemmShape<16, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1279,9 +1279,9 @@ static void BM_SM50_device_minimum_plus_dsrgemm_nn_t_32x128x8_16x32x1_4x4_4x8_2x using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1329,9 +1329,9 @@ static void BM_SM50_device_minimum_plus_dsrgemm_nn_t_64x64x8_32x16x1_4x4_8x4_2x4 using WarpShape = cutlass::gemm::GemmShape<32, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = 
Config::MultiplicationOp; @@ -1379,9 +1379,9 @@ static void BM_SM50_device_minimum_plus_dsrgemm_nn_t_32x32x8_8x16x1_2x2_4x8_4x2( using WarpShape = cutlass::gemm::GemmShape<8, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1429,9 +1429,9 @@ static void BM_SM50_device_minimum_plus_dsrgemm_nn_t_64x32x8_16x16x1_4x2_4x8_4x2 using WarpShape = cutlass::gemm::GemmShape<16, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1479,9 +1479,9 @@ static void BM_SM50_device_minimum_plus_dsrgemm_nn_t_64x64x8_16x32x1_4x4_4x8_4x2 using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1529,9 +1529,9 @@ static void 
BM_SM50_device_minimum_plus_dsrgemm_nn_t_128x32x8_32x16x1_4x4_8x4_4x using WarpShape = cutlass::gemm::GemmShape<32, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1579,9 +1579,9 @@ static void BM_SM50_device_minimum_plus_dsrgemm_nn_t_32x64x16_8x16x1_2x2_4x8_4x4 using WarpShape = cutlass::gemm::GemmShape<8, 16, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1629,9 +1629,9 @@ static void BM_SM50_device_minimum_plus_dsrgemm_nn_t_32x128x16_8x32x1_2x4_4x8_4x using WarpShape = cutlass::gemm::GemmShape<8, 32, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1679,9 +1679,9 @@ static void BM_SM50_device_minimum_plus_dsrgemm_nn_t_64x32x16_16x8x1_2x2_8x4_4x4 
using WarpShape = cutlass::gemm::GemmShape<16, 8, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1729,9 +1729,9 @@ static void BM_SM50_device_minimum_plus_dsrgemm_nn_t_64x64x8_16x16x1_4x2_4x8_4x4 using WarpShape = cutlass::gemm::GemmShape<16, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1779,9 +1779,9 @@ static void BM_SM50_device_minimum_plus_dsrgemm_nn_t_128x32x16_32x8x1_4x2_8x4_4x using WarpShape = cutlass::gemm::GemmShape<32, 8, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; diff --git a/bench/device/sm50_simt_minimum_plus_dsrgemm_nt_n.cu b/bench/device/sm50_simt_minimum_plus_dsrgemm_nt_n.cu index 783bd30..b2e80af 100644 --- 
a/bench/device/sm50_simt_minimum_plus_dsrgemm_nt_n.cu +++ b/bench/device/sm50_simt_minimum_plus_dsrgemm_nt_n.cu @@ -29,9 +29,9 @@ static void BM_SM50_device_minimum_plus_dsrgemm_nt_n_8x32x8_8x32x1_2x4_4x8_1x1(b using WarpShape = cutlass::gemm::GemmShape<8, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -79,9 +79,9 @@ static void BM_SM50_device_minimum_plus_dsrgemm_nt_n_16x32x8_16x32x1_4x4_4x8_1x1 using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -129,9 +129,9 @@ static void BM_SM50_device_minimum_plus_dsrgemm_nt_n_16x64x8_16x64x1_4x8_4x8_1x1 using WarpShape = cutlass::gemm::GemmShape<16, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using 
MultOp = Config::MultiplicationOp; @@ -179,9 +179,9 @@ static void BM_SM50_device_minimum_plus_dsrgemm_nt_n_32x32x8_32x32x1_8x4_4x8_1x1 using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -229,9 +229,9 @@ static void BM_SM50_device_minimum_plus_dsrgemm_nt_n_8x32x8_8x16x1_2x2_4x8_1x2(b using WarpShape = cutlass::gemm::GemmShape<8, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -279,9 +279,9 @@ static void BM_SM50_device_minimum_plus_dsrgemm_nt_n_8x64x8_8x32x1_2x4_4x8_1x2(b using WarpShape = cutlass::gemm::GemmShape<8, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -329,9 +329,9 @@ static void 
BM_SM50_device_minimum_plus_dsrgemm_nt_n_16x32x8_16x16x1_4x2_4x8_1x2 using WarpShape = cutlass::gemm::GemmShape<16, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -379,9 +379,9 @@ static void BM_SM50_device_minimum_plus_dsrgemm_nt_n_16x64x8_16x32x1_4x4_4x8_1x2 using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -429,9 +429,9 @@ static void BM_SM50_device_minimum_plus_dsrgemm_nt_n_16x128x8_16x64x1_4x8_4x8_1x using WarpShape = cutlass::gemm::GemmShape<16, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -479,9 +479,9 @@ static void BM_SM50_device_minimum_plus_dsrgemm_nt_n_32x32x8_32x16x1_4x4_8x4_1x2 using 
WarpShape = cutlass::gemm::GemmShape<32, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -529,9 +529,9 @@ static void BM_SM50_device_minimum_plus_dsrgemm_nt_n_32x64x8_32x32x1_8x4_4x8_1x2 using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -579,9 +579,9 @@ static void BM_SM50_device_minimum_plus_dsrgemm_nt_n_32x32x8_16x32x1_4x4_4x8_2x1 using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -629,9 +629,9 @@ static void BM_SM50_device_minimum_plus_dsrgemm_nt_n_64x32x8_32x32x1_8x4_4x8_2x1 using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = 
cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -679,9 +679,9 @@ static void BM_SM50_device_minimum_plus_dsrgemm_nt_n_16x32x8_8x16x1_2x2_4x8_2x2( using WarpShape = cutlass::gemm::GemmShape<8, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -729,9 +729,9 @@ static void BM_SM50_device_minimum_plus_dsrgemm_nt_n_16x64x8_8x32x1_2x4_4x8_2x2( using WarpShape = cutlass::gemm::GemmShape<8, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -779,9 +779,9 @@ static void BM_SM50_device_minimum_plus_dsrgemm_nt_n_32x32x8_16x16x1_4x2_4x8_2x2 using WarpShape = cutlass::gemm::GemmShape<16, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename 
cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -829,9 +829,9 @@ static void BM_SM50_device_minimum_plus_dsrgemm_nt_n_32x64x8_16x32x1_4x4_4x8_2x2 using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -879,9 +879,9 @@ static void BM_SM50_device_minimum_plus_dsrgemm_nt_n_32x128x8_16x64x1_4x8_4x8_2x using WarpShape = cutlass::gemm::GemmShape<16, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -929,9 +929,9 @@ static void BM_SM50_device_minimum_plus_dsrgemm_nt_n_64x32x8_32x16x1_4x4_8x4_2x2 using WarpShape = cutlass::gemm::GemmShape<32, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, 
precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -979,9 +979,9 @@ static void BM_SM50_device_minimum_plus_dsrgemm_nt_n_64x64x8_32x32x1_8x4_4x8_2x2 using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1029,9 +1029,9 @@ static void BM_SM50_device_minimum_plus_dsrgemm_nt_n_128x32x8_64x16x1_8x4_8x4_2x using WarpShape = cutlass::gemm::GemmShape<64, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1079,9 +1079,9 @@ static void BM_SM50_device_minimum_plus_dsrgemm_nt_n_16x64x16_8x16x1_2x2_4x8_2x4 using WarpShape = cutlass::gemm::GemmShape<8, 16, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, 
cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1129,9 +1129,9 @@ static void BM_SM50_device_minimum_plus_dsrgemm_nt_n_16x128x16_8x32x1_2x4_4x8_2x using WarpShape = cutlass::gemm::GemmShape<8, 32, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1179,9 +1179,9 @@ static void BM_SM50_device_minimum_plus_dsrgemm_nt_n_32x32x8_16x8x1_2x2_8x4_2x4( using WarpShape = cutlass::gemm::GemmShape<16, 8, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1229,9 +1229,9 @@ static void BM_SM50_device_minimum_plus_dsrgemm_nt_n_32x64x8_16x16x1_4x2_4x8_2x4 using WarpShape = cutlass::gemm::GemmShape<16, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename 
cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1279,9 +1279,9 @@ static void BM_SM50_device_minimum_plus_dsrgemm_nt_n_32x128x8_16x32x1_4x4_4x8_2x using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1329,9 +1329,9 @@ static void BM_SM50_device_minimum_plus_dsrgemm_nt_n_64x64x8_32x16x1_4x4_8x4_2x4 using WarpShape = cutlass::gemm::GemmShape<32, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1379,9 +1379,9 @@ static void BM_SM50_device_minimum_plus_dsrgemm_nt_n_32x32x8_8x16x1_2x2_4x8_4x2( using WarpShape = cutlass::gemm::GemmShape<8, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, 
precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1429,9 +1429,9 @@ static void BM_SM50_device_minimum_plus_dsrgemm_nt_n_64x32x8_16x16x1_4x2_4x8_4x2 using WarpShape = cutlass::gemm::GemmShape<16, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1479,9 +1479,9 @@ static void BM_SM50_device_minimum_plus_dsrgemm_nt_n_64x64x8_16x32x1_4x4_4x8_4x2 using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1529,9 +1529,9 @@ static void BM_SM50_device_minimum_plus_dsrgemm_nt_n_128x32x8_32x16x1_4x4_8x4_4x using WarpShape = cutlass::gemm::GemmShape<32, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, 
OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1579,9 +1579,9 @@ static void BM_SM50_device_minimum_plus_dsrgemm_nt_n_32x64x16_8x16x1_2x2_4x8_4x4 using WarpShape = cutlass::gemm::GemmShape<8, 16, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1629,9 +1629,9 @@ static void BM_SM50_device_minimum_plus_dsrgemm_nt_n_32x128x16_8x32x1_2x4_4x8_4x using WarpShape = cutlass::gemm::GemmShape<8, 32, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1679,9 +1679,9 @@ static void BM_SM50_device_minimum_plus_dsrgemm_nt_n_64x32x16_16x8x1_2x2_8x4_4x4 using WarpShape = cutlass::gemm::GemmShape<16, 8, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = 
Config::MultiplicationOp; @@ -1729,9 +1729,9 @@ static void BM_SM50_device_minimum_plus_dsrgemm_nt_n_64x64x8_16x16x1_4x2_4x8_4x4 using WarpShape = cutlass::gemm::GemmShape<16, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1779,9 +1779,9 @@ static void BM_SM50_device_minimum_plus_dsrgemm_nt_n_128x32x16_32x8x1_4x2_8x4_4x using WarpShape = cutlass::gemm::GemmShape<32, 8, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; diff --git a/bench/device/sm50_simt_minimum_plus_dsrgemm_nt_t.cu b/bench/device/sm50_simt_minimum_plus_dsrgemm_nt_t.cu index 9d9a901..d12fe7d 100644 --- a/bench/device/sm50_simt_minimum_plus_dsrgemm_nt_t.cu +++ b/bench/device/sm50_simt_minimum_plus_dsrgemm_nt_t.cu @@ -29,9 +29,9 @@ static void BM_SM50_device_minimum_plus_dsrgemm_nt_t_8x32x8_8x32x1_2x4_4x8_1x1(b using WarpShape = cutlass::gemm::GemmShape<8, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename 
cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -79,9 +79,9 @@ static void BM_SM50_device_minimum_plus_dsrgemm_nt_t_16x32x8_16x32x1_4x4_4x8_1x1 using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -129,9 +129,9 @@ static void BM_SM50_device_minimum_plus_dsrgemm_nt_t_16x64x8_16x64x1_4x8_4x8_1x1 using WarpShape = cutlass::gemm::GemmShape<16, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -179,9 +179,9 @@ static void BM_SM50_device_minimum_plus_dsrgemm_nt_t_32x32x8_32x32x1_8x4_4x8_1x1 using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, 
precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -229,9 +229,9 @@ static void BM_SM50_device_minimum_plus_dsrgemm_nt_t_8x32x8_8x16x1_2x2_4x8_1x2(b using WarpShape = cutlass::gemm::GemmShape<8, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -279,9 +279,9 @@ static void BM_SM50_device_minimum_plus_dsrgemm_nt_t_8x64x8_8x32x1_2x4_4x8_1x2(b using WarpShape = cutlass::gemm::GemmShape<8, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -329,9 +329,9 @@ static void BM_SM50_device_minimum_plus_dsrgemm_nt_t_16x32x8_16x16x1_4x2_4x8_1x2 using WarpShape = cutlass::gemm::GemmShape<16, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using 
AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -379,9 +379,9 @@ static void BM_SM50_device_minimum_plus_dsrgemm_nt_t_16x64x8_16x32x1_4x4_4x8_1x2 using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -429,9 +429,9 @@ static void BM_SM50_device_minimum_plus_dsrgemm_nt_t_16x128x8_16x64x1_4x8_4x8_1x using WarpShape = cutlass::gemm::GemmShape<16, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -479,9 +479,9 @@ static void BM_SM50_device_minimum_plus_dsrgemm_nt_t_32x32x8_32x16x1_4x4_8x4_1x2 using WarpShape = cutlass::gemm::GemmShape<32, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ 
-529,9 +529,9 @@ static void BM_SM50_device_minimum_plus_dsrgemm_nt_t_32x64x8_32x32x1_8x4_4x8_1x2 using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -579,9 +579,9 @@ static void BM_SM50_device_minimum_plus_dsrgemm_nt_t_32x32x8_16x32x1_4x4_4x8_2x1 using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -629,9 +629,9 @@ static void BM_SM50_device_minimum_plus_dsrgemm_nt_t_64x32x8_32x32x1_8x4_4x8_2x1 using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -679,9 +679,9 @@ static void 
BM_SM50_device_minimum_plus_dsrgemm_nt_t_16x32x8_8x16x1_2x2_4x8_2x2( using WarpShape = cutlass::gemm::GemmShape<8, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -729,9 +729,9 @@ static void BM_SM50_device_minimum_plus_dsrgemm_nt_t_16x64x8_8x32x1_2x4_4x8_2x2( using WarpShape = cutlass::gemm::GemmShape<8, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -779,9 +779,9 @@ static void BM_SM50_device_minimum_plus_dsrgemm_nt_t_32x32x8_16x16x1_4x2_4x8_2x2 using WarpShape = cutlass::gemm::GemmShape<16, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -829,9 +829,9 @@ static void BM_SM50_device_minimum_plus_dsrgemm_nt_t_32x64x8_16x32x1_4x4_4x8_2x2 using 
WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -879,9 +879,9 @@ static void BM_SM50_device_minimum_plus_dsrgemm_nt_t_32x128x8_16x64x1_4x8_4x8_2x using WarpShape = cutlass::gemm::GemmShape<16, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -929,9 +929,9 @@ static void BM_SM50_device_minimum_plus_dsrgemm_nt_t_64x32x8_32x16x1_4x4_8x4_2x2 using WarpShape = cutlass::gemm::GemmShape<32, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -979,9 +979,9 @@ static void BM_SM50_device_minimum_plus_dsrgemm_nt_t_64x64x8_32x32x1_8x4_4x8_2x2 using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = 
cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1029,9 +1029,9 @@ static void BM_SM50_device_minimum_plus_dsrgemm_nt_t_128x32x8_64x16x1_8x4_8x4_2x using WarpShape = cutlass::gemm::GemmShape<64, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1079,9 +1079,9 @@ static void BM_SM50_device_minimum_plus_dsrgemm_nt_t_16x64x16_8x16x1_2x2_4x8_2x4 using WarpShape = cutlass::gemm::GemmShape<8, 16, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1129,9 +1129,9 @@ static void BM_SM50_device_minimum_plus_dsrgemm_nt_t_16x128x16_8x32x1_2x4_4x8_2x using WarpShape = cutlass::gemm::GemmShape<8, 32, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename 
cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1179,9 +1179,9 @@ static void BM_SM50_device_minimum_plus_dsrgemm_nt_t_32x32x8_16x8x1_2x2_8x4_2x4( using WarpShape = cutlass::gemm::GemmShape<16, 8, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1229,9 +1229,9 @@ static void BM_SM50_device_minimum_plus_dsrgemm_nt_t_32x64x8_16x16x1_4x2_4x8_2x4 using WarpShape = cutlass::gemm::GemmShape<16, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1279,9 +1279,9 @@ static void BM_SM50_device_minimum_plus_dsrgemm_nt_t_32x128x8_16x32x1_4x4_4x8_2x using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, 
precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1329,9 +1329,9 @@ static void BM_SM50_device_minimum_plus_dsrgemm_nt_t_64x64x8_32x16x1_4x4_8x4_2x4 using WarpShape = cutlass::gemm::GemmShape<32, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1379,9 +1379,9 @@ static void BM_SM50_device_minimum_plus_dsrgemm_nt_t_32x32x8_8x16x1_2x2_4x8_4x2( using WarpShape = cutlass::gemm::GemmShape<8, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1429,9 +1429,9 @@ static void BM_SM50_device_minimum_plus_dsrgemm_nt_t_64x32x8_16x16x1_4x2_4x8_4x2 using WarpShape = cutlass::gemm::GemmShape<16, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, 
cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1479,9 +1479,9 @@ static void BM_SM50_device_minimum_plus_dsrgemm_nt_t_64x64x8_16x32x1_4x4_4x8_4x2 using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1529,9 +1529,9 @@ static void BM_SM50_device_minimum_plus_dsrgemm_nt_t_128x32x8_32x16x1_4x4_8x4_4x using WarpShape = cutlass::gemm::GemmShape<32, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1579,9 +1579,9 @@ static void BM_SM50_device_minimum_plus_dsrgemm_nt_t_32x64x16_8x16x1_2x2_4x8_4x4 using WarpShape = cutlass::gemm::GemmShape<8, 16, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename 
cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1629,9 +1629,9 @@ static void BM_SM50_device_minimum_plus_dsrgemm_nt_t_32x128x16_8x32x1_2x4_4x8_4x using WarpShape = cutlass::gemm::GemmShape<8, 32, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1679,9 +1679,9 @@ static void BM_SM50_device_minimum_plus_dsrgemm_nt_t_64x32x16_16x8x1_2x2_8x4_4x4 using WarpShape = cutlass::gemm::GemmShape<16, 8, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1729,9 +1729,9 @@ static void BM_SM50_device_minimum_plus_dsrgemm_nt_t_64x64x8_16x16x1_4x2_4x8_4x4 using WarpShape = cutlass::gemm::GemmShape<16, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, 
precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1779,9 +1779,9 @@ static void BM_SM50_device_minimum_plus_dsrgemm_nt_t_128x32x16_32x8x1_4x2_8x4_4x using WarpShape = cutlass::gemm::GemmShape<32, 8, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; diff --git a/bench/device/sm50_simt_minimum_plus_dsrgemm_tn_n.cu b/bench/device/sm50_simt_minimum_plus_dsrgemm_tn_n.cu index faab463..ec5eaab 100644 --- a/bench/device/sm50_simt_minimum_plus_dsrgemm_tn_n.cu +++ b/bench/device/sm50_simt_minimum_plus_dsrgemm_tn_n.cu @@ -29,9 +29,9 @@ static void BM_SM50_device_minimum_plus_dsrgemm_tn_n_8x32x8_8x32x1_2x4_4x8_1x1(b using WarpShape = cutlass::gemm::GemmShape<8, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -79,9 +79,9 @@ static void BM_SM50_device_minimum_plus_dsrgemm_tn_n_16x32x8_16x32x1_4x4_4x8_1x1 using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - 
precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -129,9 +129,9 @@ static void BM_SM50_device_minimum_plus_dsrgemm_tn_n_16x64x8_16x64x1_4x8_4x8_1x1 using WarpShape = cutlass::gemm::GemmShape<16, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -179,9 +179,9 @@ static void BM_SM50_device_minimum_plus_dsrgemm_tn_n_32x32x8_32x32x1_8x4_4x8_1x1 using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -229,9 +229,9 @@ static void BM_SM50_device_minimum_plus_dsrgemm_tn_n_8x32x8_8x16x1_2x2_4x8_1x2(b using WarpShape = cutlass::gemm::GemmShape<8, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, 
cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -279,9 +279,9 @@ static void BM_SM50_device_minimum_plus_dsrgemm_tn_n_8x64x8_8x32x1_2x4_4x8_1x2(b using WarpShape = cutlass::gemm::GemmShape<8, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -329,9 +329,9 @@ static void BM_SM50_device_minimum_plus_dsrgemm_tn_n_16x32x8_16x16x1_4x2_4x8_1x2 using WarpShape = cutlass::gemm::GemmShape<16, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -379,9 +379,9 @@ static void BM_SM50_device_minimum_plus_dsrgemm_tn_n_16x64x8_16x32x1_4x4_4x8_1x2 using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename 
cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -429,9 +429,9 @@ static void BM_SM50_device_minimum_plus_dsrgemm_tn_n_16x128x8_16x64x1_4x8_4x8_1x using WarpShape = cutlass::gemm::GemmShape<16, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -479,9 +479,9 @@ static void BM_SM50_device_minimum_plus_dsrgemm_tn_n_32x32x8_32x16x1_4x4_8x4_1x2 using WarpShape = cutlass::gemm::GemmShape<32, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -529,9 +529,9 @@ static void BM_SM50_device_minimum_plus_dsrgemm_tn_n_32x64x8_32x32x1_8x4_4x8_1x2 using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, 
precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -579,9 +579,9 @@ static void BM_SM50_device_minimum_plus_dsrgemm_tn_n_32x32x8_16x32x1_4x4_4x8_2x1 using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -629,9 +629,9 @@ static void BM_SM50_device_minimum_plus_dsrgemm_tn_n_64x32x8_32x32x1_8x4_4x8_2x1 using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -679,9 +679,9 @@ static void BM_SM50_device_minimum_plus_dsrgemm_tn_n_16x32x8_8x16x1_2x2_4x8_2x2( using WarpShape = cutlass::gemm::GemmShape<8, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using 
AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -729,9 +729,9 @@ static void BM_SM50_device_minimum_plus_dsrgemm_tn_n_16x64x8_8x32x1_2x4_4x8_2x2( using WarpShape = cutlass::gemm::GemmShape<8, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -779,9 +779,9 @@ static void BM_SM50_device_minimum_plus_dsrgemm_tn_n_32x32x8_16x16x1_4x2_4x8_2x2 using WarpShape = cutlass::gemm::GemmShape<16, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -829,9 +829,9 @@ static void BM_SM50_device_minimum_plus_dsrgemm_tn_n_32x64x8_16x32x1_4x4_4x8_2x2 using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ 
-879,9 +879,9 @@ static void BM_SM50_device_minimum_plus_dsrgemm_tn_n_32x128x8_16x64x1_4x8_4x8_2x using WarpShape = cutlass::gemm::GemmShape<16, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -929,9 +929,9 @@ static void BM_SM50_device_minimum_plus_dsrgemm_tn_n_64x32x8_32x16x1_4x4_8x4_2x2 using WarpShape = cutlass::gemm::GemmShape<32, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -979,9 +979,9 @@ static void BM_SM50_device_minimum_plus_dsrgemm_tn_n_64x64x8_32x32x1_8x4_4x8_2x2 using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1029,9 +1029,9 @@ static void 
BM_SM50_device_minimum_plus_dsrgemm_tn_n_128x32x8_64x16x1_8x4_8x4_2x using WarpShape = cutlass::gemm::GemmShape<64, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1079,9 +1079,9 @@ static void BM_SM50_device_minimum_plus_dsrgemm_tn_n_16x64x16_8x16x1_2x2_4x8_2x4 using WarpShape = cutlass::gemm::GemmShape<8, 16, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1129,9 +1129,9 @@ static void BM_SM50_device_minimum_plus_dsrgemm_tn_n_16x128x16_8x32x1_2x4_4x8_2x using WarpShape = cutlass::gemm::GemmShape<8, 32, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1179,9 +1179,9 @@ static void BM_SM50_device_minimum_plus_dsrgemm_tn_n_32x32x8_16x8x1_2x2_8x4_2x4( 
using WarpShape = cutlass::gemm::GemmShape<16, 8, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1229,9 +1229,9 @@ static void BM_SM50_device_minimum_plus_dsrgemm_tn_n_32x64x8_16x16x1_4x2_4x8_2x4 using WarpShape = cutlass::gemm::GemmShape<16, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1279,9 +1279,9 @@ static void BM_SM50_device_minimum_plus_dsrgemm_tn_n_32x128x8_16x32x1_4x4_4x8_2x using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1329,9 +1329,9 @@ static void BM_SM50_device_minimum_plus_dsrgemm_tn_n_64x64x8_32x16x1_4x4_8x4_2x4 using WarpShape = cutlass::gemm::GemmShape<32, 16, 8>; using 
InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1379,9 +1379,9 @@ static void BM_SM50_device_minimum_plus_dsrgemm_tn_n_32x32x8_8x16x1_2x2_4x8_4x2( using WarpShape = cutlass::gemm::GemmShape<8, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1429,9 +1429,9 @@ static void BM_SM50_device_minimum_plus_dsrgemm_tn_n_64x32x8_16x16x1_4x2_4x8_4x2 using WarpShape = cutlass::gemm::GemmShape<16, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1479,9 +1479,9 @@ static void BM_SM50_device_minimum_plus_dsrgemm_tn_n_64x64x8_16x32x1_4x4_4x8_4x2 using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = 
typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1529,9 +1529,9 @@ static void BM_SM50_device_minimum_plus_dsrgemm_tn_n_128x32x8_32x16x1_4x4_8x4_4x using WarpShape = cutlass::gemm::GemmShape<32, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1579,9 +1579,9 @@ static void BM_SM50_device_minimum_plus_dsrgemm_tn_n_32x64x16_8x16x1_2x2_4x8_4x4 using WarpShape = cutlass::gemm::GemmShape<8, 16, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1629,9 +1629,9 @@ static void BM_SM50_device_minimum_plus_dsrgemm_tn_n_32x128x16_8x32x1_2x4_4x8_4x using WarpShape = cutlass::gemm::GemmShape<8, 32, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - 
precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1679,9 +1679,9 @@ static void BM_SM50_device_minimum_plus_dsrgemm_tn_n_64x32x16_16x8x1_2x2_8x4_4x4 using WarpShape = cutlass::gemm::GemmShape<16, 8, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1729,9 +1729,9 @@ static void BM_SM50_device_minimum_plus_dsrgemm_tn_n_64x64x8_16x16x1_4x2_4x8_4x4 using WarpShape = cutlass::gemm::GemmShape<16, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1779,9 +1779,9 @@ static void BM_SM50_device_minimum_plus_dsrgemm_tn_n_128x32x16_32x8x1_4x2_8x4_4x using WarpShape = cutlass::gemm::GemmShape<32, 8, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - 
cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; diff --git a/bench/device/sm50_simt_minimum_plus_dsrgemm_tn_t.cu b/bench/device/sm50_simt_minimum_plus_dsrgemm_tn_t.cu index 80710e7..2cd6f48 100644 --- a/bench/device/sm50_simt_minimum_plus_dsrgemm_tn_t.cu +++ b/bench/device/sm50_simt_minimum_plus_dsrgemm_tn_t.cu @@ -29,9 +29,9 @@ static void BM_SM50_device_minimum_plus_dsrgemm_tn_t_8x32x8_8x32x1_2x4_4x8_1x1(b using WarpShape = cutlass::gemm::GemmShape<8, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -79,9 +79,9 @@ static void BM_SM50_device_minimum_plus_dsrgemm_tn_t_16x32x8_16x32x1_4x4_4x8_1x1 using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -129,9 +129,9 @@ static void BM_SM50_device_minimum_plus_dsrgemm_tn_t_16x64x8_16x64x1_4x8_4x8_1x1 using WarpShape = cutlass::gemm::GemmShape<16, 64, 8>; using 
InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -179,9 +179,9 @@ static void BM_SM50_device_minimum_plus_dsrgemm_tn_t_32x32x8_32x32x1_8x4_4x8_1x1 using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -229,9 +229,9 @@ static void BM_SM50_device_minimum_plus_dsrgemm_tn_t_8x32x8_8x16x1_2x2_4x8_1x2(b using WarpShape = cutlass::gemm::GemmShape<8, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -279,9 +279,9 @@ static void BM_SM50_device_minimum_plus_dsrgemm_tn_t_8x64x8_8x32x1_2x4_4x8_1x2(b using WarpShape = cutlass::gemm::GemmShape<8, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = 
typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -329,9 +329,9 @@ static void BM_SM50_device_minimum_plus_dsrgemm_tn_t_16x32x8_16x16x1_4x2_4x8_1x2 using WarpShape = cutlass::gemm::GemmShape<16, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -379,9 +379,9 @@ static void BM_SM50_device_minimum_plus_dsrgemm_tn_t_16x64x8_16x32x1_4x4_4x8_1x2 using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -429,9 +429,9 @@ static void BM_SM50_device_minimum_plus_dsrgemm_tn_t_16x128x8_16x64x1_4x8_4x8_1x using WarpShape = cutlass::gemm::GemmShape<16, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, 
precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -479,9 +479,9 @@ static void BM_SM50_device_minimum_plus_dsrgemm_tn_t_32x32x8_32x16x1_4x4_8x4_1x2 using WarpShape = cutlass::gemm::GemmShape<32, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -529,9 +529,9 @@ static void BM_SM50_device_minimum_plus_dsrgemm_tn_t_32x64x8_32x32x1_8x4_4x8_1x2 using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -579,9 +579,9 @@ static void BM_SM50_device_minimum_plus_dsrgemm_tn_t_32x32x8_16x32x1_4x4_4x8_2x1 using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, 
SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -629,9 +629,9 @@ static void BM_SM50_device_minimum_plus_dsrgemm_tn_t_64x32x8_32x32x1_8x4_4x8_2x1 using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -679,9 +679,9 @@ static void BM_SM50_device_minimum_plus_dsrgemm_tn_t_16x32x8_8x16x1_2x2_4x8_2x2( using WarpShape = cutlass::gemm::GemmShape<8, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -729,9 +729,9 @@ static void BM_SM50_device_minimum_plus_dsrgemm_tn_t_16x64x8_8x32x1_2x4_4x8_2x2( using WarpShape = cutlass::gemm::GemmShape<8, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename 
cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -779,9 +779,9 @@ static void BM_SM50_device_minimum_plus_dsrgemm_tn_t_32x32x8_16x16x1_4x2_4x8_2x2 using WarpShape = cutlass::gemm::GemmShape<16, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -829,9 +829,9 @@ static void BM_SM50_device_minimum_plus_dsrgemm_tn_t_32x64x8_16x32x1_4x4_4x8_2x2 using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -879,9 +879,9 @@ static void BM_SM50_device_minimum_plus_dsrgemm_tn_t_32x128x8_16x64x1_4x8_4x8_2x using WarpShape = cutlass::gemm::GemmShape<16, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, 
precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -929,9 +929,9 @@ static void BM_SM50_device_minimum_plus_dsrgemm_tn_t_64x32x8_32x16x1_4x4_8x4_2x2 using WarpShape = cutlass::gemm::GemmShape<32, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -979,9 +979,9 @@ static void BM_SM50_device_minimum_plus_dsrgemm_tn_t_64x64x8_32x32x1_8x4_4x8_2x2 using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1029,9 +1029,9 @@ static void BM_SM50_device_minimum_plus_dsrgemm_tn_t_128x32x8_64x16x1_8x4_8x4_2x using WarpShape = cutlass::gemm::GemmShape<64, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; 
using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1079,9 +1079,9 @@ static void BM_SM50_device_minimum_plus_dsrgemm_tn_t_16x64x16_8x16x1_2x2_4x8_2x4 using WarpShape = cutlass::gemm::GemmShape<8, 16, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1129,9 +1129,9 @@ static void BM_SM50_device_minimum_plus_dsrgemm_tn_t_16x128x16_8x32x1_2x4_4x8_2x using WarpShape = cutlass::gemm::GemmShape<8, 32, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1179,9 +1179,9 @@ static void BM_SM50_device_minimum_plus_dsrgemm_tn_t_32x32x8_16x8x1_2x2_8x4_2x4( using WarpShape = cutlass::gemm::GemmShape<16, 8, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = 
Config::MultiplicationOp; @@ -1229,9 +1229,9 @@ static void BM_SM50_device_minimum_plus_dsrgemm_tn_t_32x64x8_16x16x1_4x2_4x8_2x4 using WarpShape = cutlass::gemm::GemmShape<16, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1279,9 +1279,9 @@ static void BM_SM50_device_minimum_plus_dsrgemm_tn_t_32x128x8_16x32x1_4x4_4x8_2x using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1329,9 +1329,9 @@ static void BM_SM50_device_minimum_plus_dsrgemm_tn_t_64x64x8_32x16x1_4x4_8x4_2x4 using WarpShape = cutlass::gemm::GemmShape<32, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1379,9 +1379,9 @@ static void 
BM_SM50_device_minimum_plus_dsrgemm_tn_t_32x32x8_8x16x1_2x2_4x8_4x2( using WarpShape = cutlass::gemm::GemmShape<8, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1429,9 +1429,9 @@ static void BM_SM50_device_minimum_plus_dsrgemm_tn_t_64x32x8_16x16x1_4x2_4x8_4x2 using WarpShape = cutlass::gemm::GemmShape<16, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1479,9 +1479,9 @@ static void BM_SM50_device_minimum_plus_dsrgemm_tn_t_64x64x8_16x32x1_4x4_4x8_4x2 using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1529,9 +1529,9 @@ static void BM_SM50_device_minimum_plus_dsrgemm_tn_t_128x32x8_32x16x1_4x4_8x4_4x 
using WarpShape = cutlass::gemm::GemmShape<32, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1579,9 +1579,9 @@ static void BM_SM50_device_minimum_plus_dsrgemm_tn_t_32x64x16_8x16x1_2x2_4x8_4x4 using WarpShape = cutlass::gemm::GemmShape<8, 16, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1629,9 +1629,9 @@ static void BM_SM50_device_minimum_plus_dsrgemm_tn_t_32x128x16_8x32x1_2x4_4x8_4x using WarpShape = cutlass::gemm::GemmShape<8, 32, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1679,9 +1679,9 @@ static void BM_SM50_device_minimum_plus_dsrgemm_tn_t_64x32x16_16x8x1_2x2_8x4_4x4 using WarpShape = cutlass::gemm::GemmShape<16, 8, 16>; using 
InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1729,9 +1729,9 @@ static void BM_SM50_device_minimum_plus_dsrgemm_tn_t_64x64x8_16x16x1_4x2_4x8_4x4 using WarpShape = cutlass::gemm::GemmShape<16, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1779,9 +1779,9 @@ static void BM_SM50_device_minimum_plus_dsrgemm_tn_t_128x32x16_32x8x1_4x2_8x4_4x using WarpShape = cutlass::gemm::GemmShape<32, 8, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; diff --git a/bench/device/sm50_simt_minimum_plus_dsrgemm_tt_n.cu b/bench/device/sm50_simt_minimum_plus_dsrgemm_tt_n.cu index 3984e0c..57f26eb 100644 --- a/bench/device/sm50_simt_minimum_plus_dsrgemm_tt_n.cu +++ 
b/bench/device/sm50_simt_minimum_plus_dsrgemm_tt_n.cu @@ -29,9 +29,9 @@ static void BM_SM50_device_minimum_plus_dsrgemm_tt_n_8x32x8_8x32x1_2x4_4x8_1x1(b using WarpShape = cutlass::gemm::GemmShape<8, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -79,9 +79,9 @@ static void BM_SM50_device_minimum_plus_dsrgemm_tt_n_16x32x8_16x32x1_4x4_4x8_1x1 using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -129,9 +129,9 @@ static void BM_SM50_device_minimum_plus_dsrgemm_tt_n_16x64x8_16x64x1_4x8_4x8_1x1 using WarpShape = cutlass::gemm::GemmShape<16, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -179,9 +179,9 @@ static 
void BM_SM50_device_minimum_plus_dsrgemm_tt_n_32x32x8_32x32x1_8x4_4x8_1x1 using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -229,9 +229,9 @@ static void BM_SM50_device_minimum_plus_dsrgemm_tt_n_8x32x8_8x16x1_2x2_4x8_1x2(b using WarpShape = cutlass::gemm::GemmShape<8, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -279,9 +279,9 @@ static void BM_SM50_device_minimum_plus_dsrgemm_tt_n_8x64x8_8x32x1_2x4_4x8_1x2(b using WarpShape = cutlass::gemm::GemmShape<8, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -329,9 +329,9 @@ static void BM_SM50_device_minimum_plus_dsrgemm_tt_n_16x32x8_16x16x1_4x2_4x8_1x2 
using WarpShape = cutlass::gemm::GemmShape<16, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -379,9 +379,9 @@ static void BM_SM50_device_minimum_plus_dsrgemm_tt_n_16x64x8_16x32x1_4x4_4x8_1x2 using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -429,9 +429,9 @@ static void BM_SM50_device_minimum_plus_dsrgemm_tt_n_16x128x8_16x64x1_4x8_4x8_1x using WarpShape = cutlass::gemm::GemmShape<16, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -479,9 +479,9 @@ static void BM_SM50_device_minimum_plus_dsrgemm_tt_n_32x32x8_32x16x1_4x4_8x4_1x2 using WarpShape = cutlass::gemm::GemmShape<32, 16, 8>; using 
InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -529,9 +529,9 @@ static void BM_SM50_device_minimum_plus_dsrgemm_tt_n_32x64x8_32x32x1_8x4_4x8_1x2 using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -579,9 +579,9 @@ static void BM_SM50_device_minimum_plus_dsrgemm_tt_n_32x32x8_16x32x1_4x4_4x8_2x1 using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -629,9 +629,9 @@ static void BM_SM50_device_minimum_plus_dsrgemm_tt_n_64x32x8_32x32x1_8x4_4x8_2x1 using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = 
typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -679,9 +679,9 @@ static void BM_SM50_device_minimum_plus_dsrgemm_tt_n_16x32x8_8x16x1_2x2_4x8_2x2( using WarpShape = cutlass::gemm::GemmShape<8, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -729,9 +729,9 @@ static void BM_SM50_device_minimum_plus_dsrgemm_tt_n_16x64x8_8x32x1_2x4_4x8_2x2( using WarpShape = cutlass::gemm::GemmShape<8, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -779,9 +779,9 @@ static void BM_SM50_device_minimum_plus_dsrgemm_tt_n_32x32x8_16x16x1_4x2_4x8_2x2 using WarpShape = cutlass::gemm::GemmShape<16, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, 
precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -829,9 +829,9 @@ static void BM_SM50_device_minimum_plus_dsrgemm_tt_n_32x64x8_16x32x1_4x4_4x8_2x2 using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -879,9 +879,9 @@ static void BM_SM50_device_minimum_plus_dsrgemm_tt_n_32x128x8_16x64x1_4x8_4x8_2x using WarpShape = cutlass::gemm::GemmShape<16, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -929,9 +929,9 @@ static void BM_SM50_device_minimum_plus_dsrgemm_tt_n_64x32x8_32x16x1_4x4_8x4_2x2 using WarpShape = cutlass::gemm::GemmShape<32, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, 
SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -979,9 +979,9 @@ static void BM_SM50_device_minimum_plus_dsrgemm_tt_n_64x64x8_32x32x1_8x4_4x8_2x2 using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1029,9 +1029,9 @@ static void BM_SM50_device_minimum_plus_dsrgemm_tt_n_128x32x8_64x16x1_8x4_8x4_2x using WarpShape = cutlass::gemm::GemmShape<64, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1079,9 +1079,9 @@ static void BM_SM50_device_minimum_plus_dsrgemm_tt_n_16x64x16_8x16x1_2x2_4x8_2x4 using WarpShape = cutlass::gemm::GemmShape<8, 16, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename 
cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1129,9 +1129,9 @@ static void BM_SM50_device_minimum_plus_dsrgemm_tt_n_16x128x16_8x32x1_2x4_4x8_2x using WarpShape = cutlass::gemm::GemmShape<8, 32, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1179,9 +1179,9 @@ static void BM_SM50_device_minimum_plus_dsrgemm_tt_n_32x32x8_16x8x1_2x2_8x4_2x4( using WarpShape = cutlass::gemm::GemmShape<16, 8, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1229,9 +1229,9 @@ static void BM_SM50_device_minimum_plus_dsrgemm_tt_n_32x64x8_16x16x1_4x2_4x8_2x4 using WarpShape = cutlass::gemm::GemmShape<16, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, 
precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1279,9 +1279,9 @@ static void BM_SM50_device_minimum_plus_dsrgemm_tt_n_32x128x8_16x32x1_4x4_4x8_2x using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1329,9 +1329,9 @@ static void BM_SM50_device_minimum_plus_dsrgemm_tt_n_64x64x8_32x16x1_4x4_8x4_2x4 using WarpShape = cutlass::gemm::GemmShape<32, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1379,9 +1379,9 @@ static void BM_SM50_device_minimum_plus_dsrgemm_tt_n_32x32x8_8x16x1_2x2_4x8_4x2( using WarpShape = cutlass::gemm::GemmShape<8, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, 
OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1429,9 +1429,9 @@ static void BM_SM50_device_minimum_plus_dsrgemm_tt_n_64x32x8_16x16x1_4x2_4x8_4x2 using WarpShape = cutlass::gemm::GemmShape<16, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1479,9 +1479,9 @@ static void BM_SM50_device_minimum_plus_dsrgemm_tt_n_64x64x8_16x32x1_4x4_4x8_4x2 using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1529,9 +1529,9 @@ static void BM_SM50_device_minimum_plus_dsrgemm_tt_n_128x32x8_32x16x1_4x4_8x4_4x using WarpShape = cutlass::gemm::GemmShape<32, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = 
Config::MultiplicationOp; @@ -1579,9 +1579,9 @@ static void BM_SM50_device_minimum_plus_dsrgemm_tt_n_32x64x16_8x16x1_2x2_4x8_4x4 using WarpShape = cutlass::gemm::GemmShape<8, 16, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1629,9 +1629,9 @@ static void BM_SM50_device_minimum_plus_dsrgemm_tt_n_32x128x16_8x32x1_2x4_4x8_4x using WarpShape = cutlass::gemm::GemmShape<8, 32, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1679,9 +1679,9 @@ static void BM_SM50_device_minimum_plus_dsrgemm_tt_n_64x32x16_16x8x1_2x2_8x4_4x4 using WarpShape = cutlass::gemm::GemmShape<16, 8, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1729,9 +1729,9 @@ static void 
BM_SM50_device_minimum_plus_dsrgemm_tt_n_64x64x8_16x16x1_4x2_4x8_4x4 using WarpShape = cutlass::gemm::GemmShape<16, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1779,9 +1779,9 @@ static void BM_SM50_device_minimum_plus_dsrgemm_tt_n_128x32x16_32x8x1_4x2_8x4_4x using WarpShape = cutlass::gemm::GemmShape<32, 8, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; diff --git a/bench/device/sm50_simt_minimum_plus_dsrgemm_tt_t.cu b/bench/device/sm50_simt_minimum_plus_dsrgemm_tt_t.cu index 0ed8bc8..79dff79 100644 --- a/bench/device/sm50_simt_minimum_plus_dsrgemm_tt_t.cu +++ b/bench/device/sm50_simt_minimum_plus_dsrgemm_tt_t.cu @@ -29,9 +29,9 @@ static void BM_SM50_device_minimum_plus_dsrgemm_tt_t_8x32x8_8x32x1_2x4_4x8_1x1(b using WarpShape = cutlass::gemm::GemmShape<8, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, 
precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -79,9 +79,9 @@ static void BM_SM50_device_minimum_plus_dsrgemm_tt_t_16x32x8_16x32x1_4x4_4x8_1x1 using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -129,9 +129,9 @@ static void BM_SM50_device_minimum_plus_dsrgemm_tt_t_16x64x8_16x64x1_4x8_4x8_1x1 using WarpShape = cutlass::gemm::GemmShape<16, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -179,9 +179,9 @@ static void BM_SM50_device_minimum_plus_dsrgemm_tt_t_32x32x8_32x32x1_8x4_4x8_1x1 using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, 
SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -229,9 +229,9 @@ static void BM_SM50_device_minimum_plus_dsrgemm_tt_t_8x32x8_8x16x1_2x2_4x8_1x2(b using WarpShape = cutlass::gemm::GemmShape<8, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -279,9 +279,9 @@ static void BM_SM50_device_minimum_plus_dsrgemm_tt_t_8x64x8_8x32x1_2x4_4x8_1x2(b using WarpShape = cutlass::gemm::GemmShape<8, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -329,9 +329,9 @@ static void BM_SM50_device_minimum_plus_dsrgemm_tt_t_16x32x8_16x16x1_4x2_4x8_1x2 using WarpShape = cutlass::gemm::GemmShape<16, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = 
Config::MultiplicationOp; @@ -379,9 +379,9 @@ static void BM_SM50_device_minimum_plus_dsrgemm_tt_t_16x64x8_16x32x1_4x4_4x8_1x2 using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -429,9 +429,9 @@ static void BM_SM50_device_minimum_plus_dsrgemm_tt_t_16x128x8_16x64x1_4x8_4x8_1x using WarpShape = cutlass::gemm::GemmShape<16, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -479,9 +479,9 @@ static void BM_SM50_device_minimum_plus_dsrgemm_tt_t_32x32x8_32x16x1_4x4_8x4_1x2 using WarpShape = cutlass::gemm::GemmShape<32, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -529,9 +529,9 @@ static void 
BM_SM50_device_minimum_plus_dsrgemm_tt_t_32x64x8_32x32x1_8x4_4x8_1x2 using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -579,9 +579,9 @@ static void BM_SM50_device_minimum_plus_dsrgemm_tt_t_32x32x8_16x32x1_4x4_4x8_2x1 using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -629,9 +629,9 @@ static void BM_SM50_device_minimum_plus_dsrgemm_tt_t_64x32x8_32x32x1_8x4_4x8_2x1 using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -679,9 +679,9 @@ static void BM_SM50_device_minimum_plus_dsrgemm_tt_t_16x32x8_8x16x1_2x2_4x8_2x2( using 
WarpShape = cutlass::gemm::GemmShape<8, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -729,9 +729,9 @@ static void BM_SM50_device_minimum_plus_dsrgemm_tt_t_16x64x8_8x32x1_2x4_4x8_2x2( using WarpShape = cutlass::gemm::GemmShape<8, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -779,9 +779,9 @@ static void BM_SM50_device_minimum_plus_dsrgemm_tt_t_32x32x8_16x16x1_4x2_4x8_2x2 using WarpShape = cutlass::gemm::GemmShape<16, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -829,9 +829,9 @@ static void BM_SM50_device_minimum_plus_dsrgemm_tt_t_32x64x8_16x32x1_4x4_4x8_2x2 using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = 
cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -879,9 +879,9 @@ static void BM_SM50_device_minimum_plus_dsrgemm_tt_t_32x128x8_16x64x1_4x8_4x8_2x using WarpShape = cutlass::gemm::GemmShape<16, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -929,9 +929,9 @@ static void BM_SM50_device_minimum_plus_dsrgemm_tt_t_64x32x8_32x16x1_4x4_8x4_2x2 using WarpShape = cutlass::gemm::GemmShape<32, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -979,9 +979,9 @@ static void BM_SM50_device_minimum_plus_dsrgemm_tt_t_64x64x8_32x32x1_8x4_4x8_2x2 using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename 
cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1029,9 +1029,9 @@ static void BM_SM50_device_minimum_plus_dsrgemm_tt_t_128x32x8_64x16x1_8x4_8x4_2x using WarpShape = cutlass::gemm::GemmShape<64, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1079,9 +1079,9 @@ static void BM_SM50_device_minimum_plus_dsrgemm_tt_t_16x64x16_8x16x1_2x2_4x8_2x4 using WarpShape = cutlass::gemm::GemmShape<8, 16, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1129,9 +1129,9 @@ static void BM_SM50_device_minimum_plus_dsrgemm_tt_t_16x128x16_8x32x1_2x4_4x8_2x using WarpShape = cutlass::gemm::GemmShape<8, 32, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, 
precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1179,9 +1179,9 @@ static void BM_SM50_device_minimum_plus_dsrgemm_tt_t_32x32x8_16x8x1_2x2_8x4_2x4( using WarpShape = cutlass::gemm::GemmShape<16, 8, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1229,9 +1229,9 @@ static void BM_SM50_device_minimum_plus_dsrgemm_tt_t_32x64x8_16x16x1_4x2_4x8_2x4 using WarpShape = cutlass::gemm::GemmShape<16, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1279,9 +1279,9 @@ static void BM_SM50_device_minimum_plus_dsrgemm_tt_t_32x128x8_16x32x1_4x4_4x8_2x using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, 
cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1329,9 +1329,9 @@ static void BM_SM50_device_minimum_plus_dsrgemm_tt_t_64x64x8_32x16x1_4x4_8x4_2x4 using WarpShape = cutlass::gemm::GemmShape<32, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1379,9 +1379,9 @@ static void BM_SM50_device_minimum_plus_dsrgemm_tt_t_32x32x8_8x16x1_2x2_4x8_4x2( using WarpShape = cutlass::gemm::GemmShape<8, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1429,9 +1429,9 @@ static void BM_SM50_device_minimum_plus_dsrgemm_tt_t_64x32x8_16x16x1_4x2_4x8_4x2 using WarpShape = cutlass::gemm::GemmShape<16, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename 
cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1479,9 +1479,9 @@ static void BM_SM50_device_minimum_plus_dsrgemm_tt_t_64x64x8_16x32x1_4x4_4x8_4x2 using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1529,9 +1529,9 @@ static void BM_SM50_device_minimum_plus_dsrgemm_tt_t_128x32x8_32x16x1_4x4_8x4_4x using WarpShape = cutlass::gemm::GemmShape<32, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1579,9 +1579,9 @@ static void BM_SM50_device_minimum_plus_dsrgemm_tt_t_32x64x16_8x16x1_2x2_4x8_4x4 using WarpShape = cutlass::gemm::GemmShape<8, 16, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, 
precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1629,9 +1629,9 @@ static void BM_SM50_device_minimum_plus_dsrgemm_tt_t_32x128x16_8x32x1_2x4_4x8_4x using WarpShape = cutlass::gemm::GemmShape<8, 32, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1679,9 +1679,9 @@ static void BM_SM50_device_minimum_plus_dsrgemm_tt_t_64x32x16_16x8x1_2x2_8x4_4x4 using WarpShape = cutlass::gemm::GemmShape<16, 8, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1729,9 +1729,9 @@ static void BM_SM50_device_minimum_plus_dsrgemm_tt_t_64x64x8_16x16x1_4x2_4x8_4x4 using WarpShape = cutlass::gemm::GemmShape<16, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, 
OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1779,9 +1779,9 @@ static void BM_SM50_device_minimum_plus_dsrgemm_tt_t_128x32x16_32x8x1_4x2_8x4_4x using WarpShape = cutlass::gemm::GemmShape<32, 8, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; diff --git a/bench/device/sm50_simt_minimum_plus_ssrgemm_nn_n.cu b/bench/device/sm50_simt_minimum_plus_ssrgemm_nn_n.cu index bc3fafe..6c06736 100644 --- a/bench/device/sm50_simt_minimum_plus_ssrgemm_nn_n.cu +++ b/bench/device/sm50_simt_minimum_plus_ssrgemm_nn_n.cu @@ -29,9 +29,9 @@ static void BM_SM50_device_minimum_plus_ssrgemm_nn_n_8x32x8_8x32x1_2x4_4x8_1x1(b using WarpShape = cutlass::gemm::GemmShape<8, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -79,9 +79,9 @@ static void BM_SM50_device_minimum_plus_ssrgemm_nn_n_16x32x8_16x32x1_4x4_4x8_1x1 using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - 
cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -129,9 +129,9 @@ static void BM_SM50_device_minimum_plus_ssrgemm_nn_n_16x64x8_16x64x1_4x8_4x8_1x1 using WarpShape = cutlass::gemm::GemmShape<16, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -179,9 +179,9 @@ static void BM_SM50_device_minimum_plus_ssrgemm_nn_n_32x32x8_32x32x1_8x4_4x8_1x1 using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -229,9 +229,9 @@ static void BM_SM50_device_minimum_plus_ssrgemm_nn_n_32x64x8_32x64x1_8x8_4x8_1x1 using WarpShape = cutlass::gemm::GemmShape<32, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename 
cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -279,9 +279,9 @@ static void BM_SM50_device_minimum_plus_ssrgemm_nn_n_64x32x8_64x32x1_8x8_8x4_1x1 using WarpShape = cutlass::gemm::GemmShape<64, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -329,9 +329,9 @@ static void BM_SM50_device_minimum_plus_ssrgemm_nn_n_8x32x8_8x16x1_2x2_4x8_1x2(b using WarpShape = cutlass::gemm::GemmShape<8, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -379,9 +379,9 @@ static void BM_SM50_device_minimum_plus_ssrgemm_nn_n_8x64x8_8x32x1_2x4_4x8_1x2(b using WarpShape = cutlass::gemm::GemmShape<8, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, 
precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -429,9 +429,9 @@ static void BM_SM50_device_minimum_plus_ssrgemm_nn_n_16x32x8_16x16x1_4x2_4x8_1x2 using WarpShape = cutlass::gemm::GemmShape<16, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -479,9 +479,9 @@ static void BM_SM50_device_minimum_plus_ssrgemm_nn_n_16x64x8_16x32x1_4x4_4x8_1x2 using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -529,9 +529,9 @@ static void BM_SM50_device_minimum_plus_ssrgemm_nn_n_16x128x8_16x64x1_4x8_4x8_1x using WarpShape = cutlass::gemm::GemmShape<16, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using 
AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -579,9 +579,9 @@ static void BM_SM50_device_minimum_plus_ssrgemm_nn_n_32x32x8_32x16x1_4x4_8x4_1x2 using WarpShape = cutlass::gemm::GemmShape<32, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -629,9 +629,9 @@ static void BM_SM50_device_minimum_plus_ssrgemm_nn_n_32x64x8_32x32x1_8x4_4x8_1x2 using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -679,9 +679,9 @@ static void BM_SM50_device_minimum_plus_ssrgemm_nn_n_32x128x8_32x64x1_8x8_4x8_1x using WarpShape = cutlass::gemm::GemmShape<32, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ 
-729,9 +729,9 @@ static void BM_SM50_device_minimum_plus_ssrgemm_nn_n_64x64x8_64x32x1_8x8_8x4_1x2 using WarpShape = cutlass::gemm::GemmShape<64, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -779,9 +779,9 @@ static void BM_SM50_device_minimum_plus_ssrgemm_nn_n_32x32x8_16x32x1_4x4_4x8_2x1 using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -829,9 +829,9 @@ static void BM_SM50_device_minimum_plus_ssrgemm_nn_n_64x32x8_32x32x1_8x4_4x8_2x1 using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -879,9 +879,9 @@ static void 
BM_SM50_device_minimum_plus_ssrgemm_nn_n_64x64x8_32x64x1_8x8_4x8_2x1 using WarpShape = cutlass::gemm::GemmShape<32, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -929,9 +929,9 @@ static void BM_SM50_device_minimum_plus_ssrgemm_nn_n_128x32x8_64x32x1_8x8_8x4_2x using WarpShape = cutlass::gemm::GemmShape<64, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -979,9 +979,9 @@ static void BM_SM50_device_minimum_plus_ssrgemm_nn_n_16x32x8_8x16x1_2x2_4x8_2x2( using WarpShape = cutlass::gemm::GemmShape<8, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1029,9 +1029,9 @@ static void BM_SM50_device_minimum_plus_ssrgemm_nn_n_16x64x8_8x32x1_2x4_4x8_2x2( using 
WarpShape = cutlass::gemm::GemmShape<8, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1079,9 +1079,9 @@ static void BM_SM50_device_minimum_plus_ssrgemm_nn_n_32x32x8_16x16x1_4x2_4x8_2x2 using WarpShape = cutlass::gemm::GemmShape<16, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1129,9 +1129,9 @@ static void BM_SM50_device_minimum_plus_ssrgemm_nn_n_32x64x8_16x32x1_4x4_4x8_2x2 using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1179,9 +1179,9 @@ static void BM_SM50_device_minimum_plus_ssrgemm_nn_n_32x128x8_16x64x1_4x8_4x8_2x using WarpShape = cutlass::gemm::GemmShape<16, 64, 8>; using InstructionShape 
= cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1229,9 +1229,9 @@ static void BM_SM50_device_minimum_plus_ssrgemm_nn_n_64x32x8_32x16x1_4x4_8x4_2x2 using WarpShape = cutlass::gemm::GemmShape<32, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1279,9 +1279,9 @@ static void BM_SM50_device_minimum_plus_ssrgemm_nn_n_64x64x8_32x32x1_8x4_4x8_2x2 using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1329,9 +1329,9 @@ static void BM_SM50_device_minimum_plus_ssrgemm_nn_n_64x128x8_32x64x1_8x8_4x8_2x using WarpShape = cutlass::gemm::GemmShape<32, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename 
cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1379,9 +1379,9 @@ static void BM_SM50_device_minimum_plus_ssrgemm_nn_n_128x32x8_64x16x1_8x4_8x4_2x using WarpShape = cutlass::gemm::GemmShape<64, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1429,9 +1429,9 @@ static void BM_SM50_device_minimum_plus_ssrgemm_nn_n_128x64x8_64x32x1_8x8_8x4_2x using WarpShape = cutlass::gemm::GemmShape<64, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1479,9 +1479,9 @@ static void BM_SM50_device_minimum_plus_ssrgemm_nn_n_16x64x16_8x16x1_2x2_4x8_2x4 using WarpShape = cutlass::gemm::GemmShape<8, 16, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, 
precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1529,9 +1529,9 @@ static void BM_SM50_device_minimum_plus_ssrgemm_nn_n_16x128x16_8x32x1_2x4_4x8_2x using WarpShape = cutlass::gemm::GemmShape<8, 32, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1579,9 +1579,9 @@ static void BM_SM50_device_minimum_plus_ssrgemm_nn_n_32x32x8_16x8x1_2x2_8x4_2x4( using WarpShape = cutlass::gemm::GemmShape<16, 8, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1629,9 +1629,9 @@ static void BM_SM50_device_minimum_plus_ssrgemm_nn_n_32x64x8_16x16x1_4x2_4x8_2x4 using WarpShape = cutlass::gemm::GemmShape<16, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, 
cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1679,9 +1679,9 @@ static void BM_SM50_device_minimum_plus_ssrgemm_nn_n_32x128x8_16x32x1_4x4_4x8_2x using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1729,9 +1729,9 @@ static void BM_SM50_device_minimum_plus_ssrgemm_nn_n_32x256x8_16x64x1_4x8_4x8_2x using WarpShape = cutlass::gemm::GemmShape<16, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1779,9 +1779,9 @@ static void BM_SM50_device_minimum_plus_ssrgemm_nn_n_64x64x8_32x16x1_4x4_8x4_2x4 using WarpShape = cutlass::gemm::GemmShape<32, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename 
cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1829,9 +1829,9 @@ static void BM_SM50_device_minimum_plus_ssrgemm_nn_n_64x128x8_32x32x1_8x4_4x8_2x using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1879,9 +1879,9 @@ static void BM_SM50_device_minimum_plus_ssrgemm_nn_n_64x256x8_32x64x1_8x8_4x8_2x using WarpShape = cutlass::gemm::GemmShape<32, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1929,9 +1929,9 @@ static void BM_SM50_device_minimum_plus_ssrgemm_nn_n_128x128x8_64x32x1_8x8_8x4_2 using WarpShape = cutlass::gemm::GemmShape<64, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, 
precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1979,9 +1979,9 @@ static void BM_SM50_device_minimum_plus_ssrgemm_nn_n_32x32x8_8x16x1_2x2_4x8_4x2( using WarpShape = cutlass::gemm::GemmShape<8, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -2029,9 +2029,9 @@ static void BM_SM50_device_minimum_plus_ssrgemm_nn_n_64x32x8_16x16x1_4x2_4x8_4x2 using WarpShape = cutlass::gemm::GemmShape<16, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -2079,9 +2079,9 @@ static void BM_SM50_device_minimum_plus_ssrgemm_nn_n_64x64x8_16x32x1_4x4_4x8_4x2 using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, 
OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -2129,9 +2129,9 @@ static void BM_SM50_device_minimum_plus_ssrgemm_nn_n_128x32x8_32x16x1_4x4_8x4_4x using WarpShape = cutlass::gemm::GemmShape<32, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -2179,9 +2179,9 @@ static void BM_SM50_device_minimum_plus_ssrgemm_nn_n_128x64x8_32x32x1_8x4_4x8_4x using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -2229,9 +2229,9 @@ static void BM_SM50_device_minimum_plus_ssrgemm_nn_n_128x128x8_32x64x1_8x8_4x8_4 using WarpShape = cutlass::gemm::GemmShape<32, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = 
Config::MultiplicationOp; @@ -2279,9 +2279,9 @@ static void BM_SM50_device_minimum_plus_ssrgemm_nn_n_256x32x8_64x16x1_8x4_8x4_4x using WarpShape = cutlass::gemm::GemmShape<64, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -2329,9 +2329,9 @@ static void BM_SM50_device_minimum_plus_ssrgemm_nn_n_256x64x8_64x32x1_8x8_8x4_4x using WarpShape = cutlass::gemm::GemmShape<64, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -2379,9 +2379,9 @@ static void BM_SM50_device_minimum_plus_ssrgemm_nn_n_32x64x16_8x16x1_2x2_4x8_4x4 using WarpShape = cutlass::gemm::GemmShape<8, 16, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -2429,9 +2429,9 @@ static void 
BM_SM50_device_minimum_plus_ssrgemm_nn_n_32x128x16_8x32x1_2x4_4x8_4x using WarpShape = cutlass::gemm::GemmShape<8, 32, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -2479,9 +2479,9 @@ static void BM_SM50_device_minimum_plus_ssrgemm_nn_n_64x32x16_16x8x1_2x2_8x4_4x4 using WarpShape = cutlass::gemm::GemmShape<16, 8, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -2529,9 +2529,9 @@ static void BM_SM50_device_minimum_plus_ssrgemm_nn_n_64x64x8_16x16x1_4x2_4x8_4x4 using WarpShape = cutlass::gemm::GemmShape<16, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -2579,9 +2579,9 @@ static void BM_SM50_device_minimum_plus_ssrgemm_nn_n_64x128x8_16x32x1_4x4_4x8_4x 
using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -2629,9 +2629,9 @@ static void BM_SM50_device_minimum_plus_ssrgemm_nn_n_64x256x8_16x64x1_4x8_4x8_4x using WarpShape = cutlass::gemm::GemmShape<16, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -2679,9 +2679,9 @@ static void BM_SM50_device_minimum_plus_ssrgemm_nn_n_128x32x16_32x8x1_4x2_8x4_4x using WarpShape = cutlass::gemm::GemmShape<32, 8, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -2729,9 +2729,9 @@ static void BM_SM50_device_minimum_plus_ssrgemm_nn_n_128x64x8_32x16x1_4x4_8x4_4x using WarpShape = cutlass::gemm::GemmShape<32, 16, 8>; using 
InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -2779,9 +2779,9 @@ static void BM_SM50_device_minimum_plus_ssrgemm_nn_n_128x128x8_32x32x1_8x4_4x8_4 using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -2829,9 +2829,9 @@ static void BM_SM50_device_minimum_plus_ssrgemm_nn_n_256x64x8_64x16x1_8x4_8x4_4x using WarpShape = cutlass::gemm::GemmShape<64, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; diff --git a/bench/device/sm50_simt_minimum_plus_ssrgemm_nn_t.cu b/bench/device/sm50_simt_minimum_plus_ssrgemm_nn_t.cu index 29367c4..2085bec 100644 --- a/bench/device/sm50_simt_minimum_plus_ssrgemm_nn_t.cu +++ 
b/bench/device/sm50_simt_minimum_plus_ssrgemm_nn_t.cu @@ -29,9 +29,9 @@ static void BM_SM50_device_minimum_plus_ssrgemm_nn_t_8x32x8_8x32x1_2x4_4x8_1x1(b using WarpShape = cutlass::gemm::GemmShape<8, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -79,9 +79,9 @@ static void BM_SM50_device_minimum_plus_ssrgemm_nn_t_16x32x8_16x32x1_4x4_4x8_1x1 using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -129,9 +129,9 @@ static void BM_SM50_device_minimum_plus_ssrgemm_nn_t_16x64x8_16x64x1_4x8_4x8_1x1 using WarpShape = cutlass::gemm::GemmShape<16, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -179,9 +179,9 @@ static 
void BM_SM50_device_minimum_plus_ssrgemm_nn_t_32x32x8_32x32x1_8x4_4x8_1x1 using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -229,9 +229,9 @@ static void BM_SM50_device_minimum_plus_ssrgemm_nn_t_32x64x8_32x64x1_8x8_4x8_1x1 using WarpShape = cutlass::gemm::GemmShape<32, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -279,9 +279,9 @@ static void BM_SM50_device_minimum_plus_ssrgemm_nn_t_64x32x8_64x32x1_8x8_8x4_1x1 using WarpShape = cutlass::gemm::GemmShape<64, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -329,9 +329,9 @@ static void BM_SM50_device_minimum_plus_ssrgemm_nn_t_8x32x8_8x16x1_2x2_4x8_1x2(b 
using WarpShape = cutlass::gemm::GemmShape<8, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -379,9 +379,9 @@ static void BM_SM50_device_minimum_plus_ssrgemm_nn_t_8x64x8_8x32x1_2x4_4x8_1x2(b using WarpShape = cutlass::gemm::GemmShape<8, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -429,9 +429,9 @@ static void BM_SM50_device_minimum_plus_ssrgemm_nn_t_16x32x8_16x16x1_4x2_4x8_1x2 using WarpShape = cutlass::gemm::GemmShape<16, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -479,9 +479,9 @@ static void BM_SM50_device_minimum_plus_ssrgemm_nn_t_16x64x8_16x32x1_4x4_4x8_1x2 using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape 
= cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -529,9 +529,9 @@ static void BM_SM50_device_minimum_plus_ssrgemm_nn_t_16x128x8_16x64x1_4x8_4x8_1x using WarpShape = cutlass::gemm::GemmShape<16, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -579,9 +579,9 @@ static void BM_SM50_device_minimum_plus_ssrgemm_nn_t_32x32x8_32x16x1_4x4_8x4_1x2 using WarpShape = cutlass::gemm::GemmShape<32, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -629,9 +629,9 @@ static void BM_SM50_device_minimum_plus_ssrgemm_nn_t_32x64x8_32x32x1_8x4_4x8_1x2 using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename 
cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -679,9 +679,9 @@ static void BM_SM50_device_minimum_plus_ssrgemm_nn_t_32x128x8_32x64x1_8x8_4x8_1x using WarpShape = cutlass::gemm::GemmShape<32, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -729,9 +729,9 @@ static void BM_SM50_device_minimum_plus_ssrgemm_nn_t_64x64x8_64x32x1_8x8_8x4_1x2 using WarpShape = cutlass::gemm::GemmShape<64, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -779,9 +779,9 @@ static void BM_SM50_device_minimum_plus_ssrgemm_nn_t_32x32x8_16x32x1_4x4_4x8_2x1 using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, 
precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -829,9 +829,9 @@ static void BM_SM50_device_minimum_plus_ssrgemm_nn_t_64x32x8_32x32x1_8x4_4x8_2x1 using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -879,9 +879,9 @@ static void BM_SM50_device_minimum_plus_ssrgemm_nn_t_64x64x8_32x64x1_8x8_4x8_2x1 using WarpShape = cutlass::gemm::GemmShape<32, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -929,9 +929,9 @@ static void BM_SM50_device_minimum_plus_ssrgemm_nn_t_128x32x8_64x32x1_8x8_8x4_2x using WarpShape = cutlass::gemm::GemmShape<64, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, 
SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -979,9 +979,9 @@ static void BM_SM50_device_minimum_plus_ssrgemm_nn_t_16x32x8_8x16x1_2x2_4x8_2x2( using WarpShape = cutlass::gemm::GemmShape<8, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1029,9 +1029,9 @@ static void BM_SM50_device_minimum_plus_ssrgemm_nn_t_16x64x8_8x32x1_2x4_4x8_2x2( using WarpShape = cutlass::gemm::GemmShape<8, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1079,9 +1079,9 @@ static void BM_SM50_device_minimum_plus_ssrgemm_nn_t_32x32x8_16x16x1_4x2_4x8_2x2 using WarpShape = cutlass::gemm::GemmShape<16, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename 
cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1129,9 +1129,9 @@ static void BM_SM50_device_minimum_plus_ssrgemm_nn_t_32x64x8_16x32x1_4x4_4x8_2x2 using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1179,9 +1179,9 @@ static void BM_SM50_device_minimum_plus_ssrgemm_nn_t_32x128x8_16x64x1_4x8_4x8_2x using WarpShape = cutlass::gemm::GemmShape<16, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1229,9 +1229,9 @@ static void BM_SM50_device_minimum_plus_ssrgemm_nn_t_64x32x8_32x16x1_4x4_8x4_2x2 using WarpShape = cutlass::gemm::GemmShape<32, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, 
precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1279,9 +1279,9 @@ static void BM_SM50_device_minimum_plus_ssrgemm_nn_t_64x64x8_32x32x1_8x4_4x8_2x2 using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1329,9 +1329,9 @@ static void BM_SM50_device_minimum_plus_ssrgemm_nn_t_64x128x8_32x64x1_8x8_4x8_2x using WarpShape = cutlass::gemm::GemmShape<32, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1379,9 +1379,9 @@ static void BM_SM50_device_minimum_plus_ssrgemm_nn_t_128x32x8_64x16x1_8x4_8x4_2x using WarpShape = cutlass::gemm::GemmShape<64, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, 
OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1429,9 +1429,9 @@ static void BM_SM50_device_minimum_plus_ssrgemm_nn_t_128x64x8_64x32x1_8x8_8x4_2x using WarpShape = cutlass::gemm::GemmShape<64, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1479,9 +1479,9 @@ static void BM_SM50_device_minimum_plus_ssrgemm_nn_t_16x64x16_8x16x1_2x2_4x8_2x4 using WarpShape = cutlass::gemm::GemmShape<8, 16, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1529,9 +1529,9 @@ static void BM_SM50_device_minimum_plus_ssrgemm_nn_t_16x128x16_8x32x1_2x4_4x8_2x using WarpShape = cutlass::gemm::GemmShape<8, 32, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = 
Config::MultiplicationOp; @@ -1579,9 +1579,9 @@ static void BM_SM50_device_minimum_plus_ssrgemm_nn_t_32x32x8_16x8x1_2x2_8x4_2x4( using WarpShape = cutlass::gemm::GemmShape<16, 8, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1629,9 +1629,9 @@ static void BM_SM50_device_minimum_plus_ssrgemm_nn_t_32x64x8_16x16x1_4x2_4x8_2x4 using WarpShape = cutlass::gemm::GemmShape<16, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1679,9 +1679,9 @@ static void BM_SM50_device_minimum_plus_ssrgemm_nn_t_32x128x8_16x32x1_4x4_4x8_2x using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1729,9 +1729,9 @@ static void 
BM_SM50_device_minimum_plus_ssrgemm_nn_t_32x256x8_16x64x1_4x8_4x8_2x using WarpShape = cutlass::gemm::GemmShape<16, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1779,9 +1779,9 @@ static void BM_SM50_device_minimum_plus_ssrgemm_nn_t_64x64x8_32x16x1_4x4_8x4_2x4 using WarpShape = cutlass::gemm::GemmShape<32, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1829,9 +1829,9 @@ static void BM_SM50_device_minimum_plus_ssrgemm_nn_t_64x128x8_32x32x1_8x4_4x8_2x using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1879,9 +1879,9 @@ static void BM_SM50_device_minimum_plus_ssrgemm_nn_t_64x256x8_32x64x1_8x8_4x8_2x 
using WarpShape = cutlass::gemm::GemmShape<32, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1929,9 +1929,9 @@ static void BM_SM50_device_minimum_plus_ssrgemm_nn_t_128x128x8_64x32x1_8x8_8x4_2 using WarpShape = cutlass::gemm::GemmShape<64, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1979,9 +1979,9 @@ static void BM_SM50_device_minimum_plus_ssrgemm_nn_t_32x32x8_8x16x1_2x2_4x8_4x2( using WarpShape = cutlass::gemm::GemmShape<8, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -2029,9 +2029,9 @@ static void BM_SM50_device_minimum_plus_ssrgemm_nn_t_64x32x8_16x16x1_4x2_4x8_4x2 using WarpShape = cutlass::gemm::GemmShape<16, 16, 8>; using 
InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -2079,9 +2079,9 @@ static void BM_SM50_device_minimum_plus_ssrgemm_nn_t_64x64x8_16x32x1_4x4_4x8_4x2 using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -2129,9 +2129,9 @@ static void BM_SM50_device_minimum_plus_ssrgemm_nn_t_128x32x8_32x16x1_4x4_8x4_4x using WarpShape = cutlass::gemm::GemmShape<32, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -2179,9 +2179,9 @@ static void BM_SM50_device_minimum_plus_ssrgemm_nn_t_128x64x8_32x32x1_8x4_4x8_4x using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = 
typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -2229,9 +2229,9 @@ static void BM_SM50_device_minimum_plus_ssrgemm_nn_t_128x128x8_32x64x1_8x8_4x8_4 using WarpShape = cutlass::gemm::GemmShape<32, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -2279,9 +2279,9 @@ static void BM_SM50_device_minimum_plus_ssrgemm_nn_t_256x32x8_64x16x1_8x4_8x4_4x using WarpShape = cutlass::gemm::GemmShape<64, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -2329,9 +2329,9 @@ static void BM_SM50_device_minimum_plus_ssrgemm_nn_t_256x64x8_64x32x1_8x8_8x4_4x using WarpShape = cutlass::gemm::GemmShape<64, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - 
precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -2379,9 +2379,9 @@ static void BM_SM50_device_minimum_plus_ssrgemm_nn_t_32x64x16_8x16x1_2x2_4x8_4x4 using WarpShape = cutlass::gemm::GemmShape<8, 16, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -2429,9 +2429,9 @@ static void BM_SM50_device_minimum_plus_ssrgemm_nn_t_32x128x16_8x32x1_2x4_4x8_4x using WarpShape = cutlass::gemm::GemmShape<8, 32, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -2479,9 +2479,9 @@ static void BM_SM50_device_minimum_plus_ssrgemm_nn_t_64x32x16_16x8x1_2x2_8x4_4x4 using WarpShape = cutlass::gemm::GemmShape<16, 8, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - 
cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -2529,9 +2529,9 @@ static void BM_SM50_device_minimum_plus_ssrgemm_nn_t_64x64x8_16x16x1_4x2_4x8_4x4 using WarpShape = cutlass::gemm::GemmShape<16, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -2579,9 +2579,9 @@ static void BM_SM50_device_minimum_plus_ssrgemm_nn_t_64x128x8_16x32x1_4x4_4x8_4x using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -2629,9 +2629,9 @@ static void BM_SM50_device_minimum_plus_ssrgemm_nn_t_64x256x8_16x64x1_4x8_4x8_4x using WarpShape = cutlass::gemm::GemmShape<16, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename 
cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -2679,9 +2679,9 @@ static void BM_SM50_device_minimum_plus_ssrgemm_nn_t_128x32x16_32x8x1_4x2_8x4_4x using WarpShape = cutlass::gemm::GemmShape<32, 8, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -2729,9 +2729,9 @@ static void BM_SM50_device_minimum_plus_ssrgemm_nn_t_128x64x8_32x16x1_4x4_8x4_4x using WarpShape = cutlass::gemm::GemmShape<32, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -2779,9 +2779,9 @@ static void BM_SM50_device_minimum_plus_ssrgemm_nn_t_128x128x8_32x32x1_8x4_4x8_4 using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, 
precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -2829,9 +2829,9 @@ static void BM_SM50_device_minimum_plus_ssrgemm_nn_t_256x64x8_64x16x1_8x4_8x4_4x using WarpShape = cutlass::gemm::GemmShape<64, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; diff --git a/bench/device/sm50_simt_minimum_plus_ssrgemm_nt_n.cu b/bench/device/sm50_simt_minimum_plus_ssrgemm_nt_n.cu index e3d8f84..e9a2912 100644 --- a/bench/device/sm50_simt_minimum_plus_ssrgemm_nt_n.cu +++ b/bench/device/sm50_simt_minimum_plus_ssrgemm_nt_n.cu @@ -29,9 +29,9 @@ static void BM_SM50_device_minimum_plus_ssrgemm_nt_n_8x32x8_8x32x1_2x4_4x8_1x1(b using WarpShape = cutlass::gemm::GemmShape<8, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -79,9 +79,9 @@ static void BM_SM50_device_minimum_plus_ssrgemm_nt_n_16x32x8_16x32x1_4x4_4x8_1x1 using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - 
precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -129,9 +129,9 @@ static void BM_SM50_device_minimum_plus_ssrgemm_nt_n_16x64x8_16x64x1_4x8_4x8_1x1 using WarpShape = cutlass::gemm::GemmShape<16, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -179,9 +179,9 @@ static void BM_SM50_device_minimum_plus_ssrgemm_nt_n_32x32x8_32x32x1_8x4_4x8_1x1 using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -229,9 +229,9 @@ static void BM_SM50_device_minimum_plus_ssrgemm_nt_n_32x64x8_32x64x1_8x8_4x8_1x1 using WarpShape = cutlass::gemm::GemmShape<32, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, 
cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -279,9 +279,9 @@ static void BM_SM50_device_minimum_plus_ssrgemm_nt_n_64x32x8_64x32x1_8x8_8x4_1x1 using WarpShape = cutlass::gemm::GemmShape<64, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -329,9 +329,9 @@ static void BM_SM50_device_minimum_plus_ssrgemm_nt_n_8x32x8_8x16x1_2x2_4x8_1x2(b using WarpShape = cutlass::gemm::GemmShape<8, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -379,9 +379,9 @@ static void BM_SM50_device_minimum_plus_ssrgemm_nt_n_8x64x8_8x32x1_2x4_4x8_1x2(b using WarpShape = cutlass::gemm::GemmShape<8, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename 
cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -429,9 +429,9 @@ static void BM_SM50_device_minimum_plus_ssrgemm_nt_n_16x32x8_16x16x1_4x2_4x8_1x2 using WarpShape = cutlass::gemm::GemmShape<16, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -479,9 +479,9 @@ static void BM_SM50_device_minimum_plus_ssrgemm_nt_n_16x64x8_16x32x1_4x4_4x8_1x2 using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -529,9 +529,9 @@ static void BM_SM50_device_minimum_plus_ssrgemm_nt_n_16x128x8_16x64x1_4x8_4x8_1x using WarpShape = cutlass::gemm::GemmShape<16, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, 
precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -579,9 +579,9 @@ static void BM_SM50_device_minimum_plus_ssrgemm_nt_n_32x32x8_32x16x1_4x4_8x4_1x2 using WarpShape = cutlass::gemm::GemmShape<32, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -629,9 +629,9 @@ static void BM_SM50_device_minimum_plus_ssrgemm_nt_n_32x64x8_32x32x1_8x4_4x8_1x2 using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -679,9 +679,9 @@ static void BM_SM50_device_minimum_plus_ssrgemm_nt_n_32x128x8_32x64x1_8x8_4x8_1x using WarpShape = cutlass::gemm::GemmShape<32, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using 
AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -729,9 +729,9 @@ static void BM_SM50_device_minimum_plus_ssrgemm_nt_n_64x64x8_64x32x1_8x8_8x4_1x2 using WarpShape = cutlass::gemm::GemmShape<64, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -779,9 +779,9 @@ static void BM_SM50_device_minimum_plus_ssrgemm_nt_n_32x32x8_16x32x1_4x4_4x8_2x1 using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -829,9 +829,9 @@ static void BM_SM50_device_minimum_plus_ssrgemm_nt_n_64x32x8_32x32x1_8x4_4x8_2x1 using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ 
-879,9 +879,9 @@ static void BM_SM50_device_minimum_plus_ssrgemm_nt_n_64x64x8_32x64x1_8x8_4x8_2x1 using WarpShape = cutlass::gemm::GemmShape<32, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -929,9 +929,9 @@ static void BM_SM50_device_minimum_plus_ssrgemm_nt_n_128x32x8_64x32x1_8x8_8x4_2x using WarpShape = cutlass::gemm::GemmShape<64, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -979,9 +979,9 @@ static void BM_SM50_device_minimum_plus_ssrgemm_nt_n_16x32x8_8x16x1_2x2_4x8_2x2( using WarpShape = cutlass::gemm::GemmShape<8, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1029,9 +1029,9 @@ static void 
BM_SM50_device_minimum_plus_ssrgemm_nt_n_16x64x8_8x32x1_2x4_4x8_2x2( using WarpShape = cutlass::gemm::GemmShape<8, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1079,9 +1079,9 @@ static void BM_SM50_device_minimum_plus_ssrgemm_nt_n_32x32x8_16x16x1_4x2_4x8_2x2 using WarpShape = cutlass::gemm::GemmShape<16, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1129,9 +1129,9 @@ static void BM_SM50_device_minimum_plus_ssrgemm_nt_n_32x64x8_16x32x1_4x4_4x8_2x2 using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1179,9 +1179,9 @@ static void BM_SM50_device_minimum_plus_ssrgemm_nt_n_32x128x8_16x64x1_4x8_4x8_2x 
using WarpShape = cutlass::gemm::GemmShape<16, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1229,9 +1229,9 @@ static void BM_SM50_device_minimum_plus_ssrgemm_nt_n_64x32x8_32x16x1_4x4_8x4_2x2 using WarpShape = cutlass::gemm::GemmShape<32, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1279,9 +1279,9 @@ static void BM_SM50_device_minimum_plus_ssrgemm_nt_n_64x64x8_32x32x1_8x4_4x8_2x2 using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1329,9 +1329,9 @@ static void BM_SM50_device_minimum_plus_ssrgemm_nt_n_64x128x8_32x64x1_8x8_4x8_2x using WarpShape = cutlass::gemm::GemmShape<32, 64, 8>; using 
InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1379,9 +1379,9 @@ static void BM_SM50_device_minimum_plus_ssrgemm_nt_n_128x32x8_64x16x1_8x4_8x4_2x using WarpShape = cutlass::gemm::GemmShape<64, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1429,9 +1429,9 @@ static void BM_SM50_device_minimum_plus_ssrgemm_nt_n_128x64x8_64x32x1_8x8_8x4_2x using WarpShape = cutlass::gemm::GemmShape<64, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1479,9 +1479,9 @@ static void BM_SM50_device_minimum_plus_ssrgemm_nt_n_16x64x16_8x16x1_2x2_4x8_2x4 using WarpShape = cutlass::gemm::GemmShape<8, 16, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = 
typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1529,9 +1529,9 @@ static void BM_SM50_device_minimum_plus_ssrgemm_nt_n_16x128x16_8x32x1_2x4_4x8_2x using WarpShape = cutlass::gemm::GemmShape<8, 32, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1579,9 +1579,9 @@ static void BM_SM50_device_minimum_plus_ssrgemm_nt_n_32x32x8_16x8x1_2x2_8x4_2x4( using WarpShape = cutlass::gemm::GemmShape<16, 8, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1629,9 +1629,9 @@ static void BM_SM50_device_minimum_plus_ssrgemm_nt_n_32x64x8_16x16x1_4x2_4x8_2x4 using WarpShape = cutlass::gemm::GemmShape<16, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - 
precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1679,9 +1679,9 @@ static void BM_SM50_device_minimum_plus_ssrgemm_nt_n_32x128x8_16x32x1_4x4_4x8_2x using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1729,9 +1729,9 @@ static void BM_SM50_device_minimum_plus_ssrgemm_nt_n_32x256x8_16x64x1_4x8_4x8_2x using WarpShape = cutlass::gemm::GemmShape<16, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1779,9 +1779,9 @@ static void BM_SM50_device_minimum_plus_ssrgemm_nt_n_64x64x8_32x16x1_4x4_8x4_2x4 using WarpShape = cutlass::gemm::GemmShape<32, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - 
cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1829,9 +1829,9 @@ static void BM_SM50_device_minimum_plus_ssrgemm_nt_n_64x128x8_32x32x1_8x4_4x8_2x using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1879,9 +1879,9 @@ static void BM_SM50_device_minimum_plus_ssrgemm_nt_n_64x256x8_32x64x1_8x8_4x8_2x using WarpShape = cutlass::gemm::GemmShape<32, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1929,9 +1929,9 @@ static void BM_SM50_device_minimum_plus_ssrgemm_nt_n_128x128x8_64x32x1_8x8_8x4_2 using WarpShape = cutlass::gemm::GemmShape<64, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename 
cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1979,9 +1979,9 @@ static void BM_SM50_device_minimum_plus_ssrgemm_nt_n_32x32x8_8x16x1_2x2_4x8_4x2( using WarpShape = cutlass::gemm::GemmShape<8, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -2029,9 +2029,9 @@ static void BM_SM50_device_minimum_plus_ssrgemm_nt_n_64x32x8_16x16x1_4x2_4x8_4x2 using WarpShape = cutlass::gemm::GemmShape<16, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -2079,9 +2079,9 @@ static void BM_SM50_device_minimum_plus_ssrgemm_nt_n_64x64x8_16x32x1_4x4_4x8_4x2 using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, 
precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -2129,9 +2129,9 @@ static void BM_SM50_device_minimum_plus_ssrgemm_nt_n_128x32x8_32x16x1_4x4_8x4_4x using WarpShape = cutlass::gemm::GemmShape<32, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -2179,9 +2179,9 @@ static void BM_SM50_device_minimum_plus_ssrgemm_nt_n_128x64x8_32x32x1_8x4_4x8_4x using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -2229,9 +2229,9 @@ static void BM_SM50_device_minimum_plus_ssrgemm_nt_n_128x128x8_32x64x1_8x8_4x8_4 using WarpShape = cutlass::gemm::GemmShape<32, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, 
OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -2279,9 +2279,9 @@ static void BM_SM50_device_minimum_plus_ssrgemm_nt_n_256x32x8_64x16x1_8x4_8x4_4x using WarpShape = cutlass::gemm::GemmShape<64, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -2329,9 +2329,9 @@ static void BM_SM50_device_minimum_plus_ssrgemm_nt_n_256x64x8_64x32x1_8x8_8x4_4x using WarpShape = cutlass::gemm::GemmShape<64, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -2379,9 +2379,9 @@ static void BM_SM50_device_minimum_plus_ssrgemm_nt_n_32x64x16_8x16x1_2x2_4x8_4x4 using WarpShape = cutlass::gemm::GemmShape<8, 16, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = 
Config::MultiplicationOp; @@ -2429,9 +2429,9 @@ static void BM_SM50_device_minimum_plus_ssrgemm_nt_n_32x128x16_8x32x1_2x4_4x8_4x using WarpShape = cutlass::gemm::GemmShape<8, 32, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -2479,9 +2479,9 @@ static void BM_SM50_device_minimum_plus_ssrgemm_nt_n_64x32x16_16x8x1_2x2_8x4_4x4 using WarpShape = cutlass::gemm::GemmShape<16, 8, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -2529,9 +2529,9 @@ static void BM_SM50_device_minimum_plus_ssrgemm_nt_n_64x64x8_16x16x1_4x2_4x8_4x4 using WarpShape = cutlass::gemm::GemmShape<16, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -2579,9 +2579,9 @@ static void 
BM_SM50_device_minimum_plus_ssrgemm_nt_n_64x128x8_16x32x1_4x4_4x8_4x using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -2629,9 +2629,9 @@ static void BM_SM50_device_minimum_plus_ssrgemm_nt_n_64x256x8_16x64x1_4x8_4x8_4x using WarpShape = cutlass::gemm::GemmShape<16, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -2679,9 +2679,9 @@ static void BM_SM50_device_minimum_plus_ssrgemm_nt_n_128x32x16_32x8x1_4x2_8x4_4x using WarpShape = cutlass::gemm::GemmShape<32, 8, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -2729,9 +2729,9 @@ static void BM_SM50_device_minimum_plus_ssrgemm_nt_n_128x64x8_32x16x1_4x4_8x4_4x 
using WarpShape = cutlass::gemm::GemmShape<32, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -2779,9 +2779,9 @@ static void BM_SM50_device_minimum_plus_ssrgemm_nt_n_128x128x8_32x32x1_8x4_4x8_4 using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -2829,9 +2829,9 @@ static void BM_SM50_device_minimum_plus_ssrgemm_nt_n_256x64x8_64x16x1_8x4_8x4_4x using WarpShape = cutlass::gemm::GemmShape<64, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; diff --git a/bench/device/sm50_simt_minimum_plus_ssrgemm_nt_t.cu b/bench/device/sm50_simt_minimum_plus_ssrgemm_nt_t.cu index 0d9dfc4..742e97c 100644 --- 
a/bench/device/sm50_simt_minimum_plus_ssrgemm_nt_t.cu +++ b/bench/device/sm50_simt_minimum_plus_ssrgemm_nt_t.cu @@ -29,9 +29,9 @@ static void BM_SM50_device_minimum_plus_ssrgemm_nt_t_8x32x8_8x32x1_2x4_4x8_1x1(b using WarpShape = cutlass::gemm::GemmShape<8, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -79,9 +79,9 @@ static void BM_SM50_device_minimum_plus_ssrgemm_nt_t_16x32x8_16x32x1_4x4_4x8_1x1 using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -129,9 +129,9 @@ static void BM_SM50_device_minimum_plus_ssrgemm_nt_t_16x64x8_16x64x1_4x8_4x8_1x1 using WarpShape = cutlass::gemm::GemmShape<16, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using 
MultOp = Config::MultiplicationOp; @@ -179,9 +179,9 @@ static void BM_SM50_device_minimum_plus_ssrgemm_nt_t_32x32x8_32x32x1_8x4_4x8_1x1 using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -229,9 +229,9 @@ static void BM_SM50_device_minimum_plus_ssrgemm_nt_t_32x64x8_32x64x1_8x8_4x8_1x1 using WarpShape = cutlass::gemm::GemmShape<32, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -279,9 +279,9 @@ static void BM_SM50_device_minimum_plus_ssrgemm_nt_t_64x32x8_64x32x1_8x8_8x4_1x1 using WarpShape = cutlass::gemm::GemmShape<64, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -329,9 +329,9 @@ static void 
BM_SM50_device_minimum_plus_ssrgemm_nt_t_8x32x8_8x16x1_2x2_4x8_1x2(b using WarpShape = cutlass::gemm::GemmShape<8, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -379,9 +379,9 @@ static void BM_SM50_device_minimum_plus_ssrgemm_nt_t_8x64x8_8x32x1_2x4_4x8_1x2(b using WarpShape = cutlass::gemm::GemmShape<8, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -429,9 +429,9 @@ static void BM_SM50_device_minimum_plus_ssrgemm_nt_t_16x32x8_16x16x1_4x2_4x8_1x2 using WarpShape = cutlass::gemm::GemmShape<16, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -479,9 +479,9 @@ static void BM_SM50_device_minimum_plus_ssrgemm_nt_t_16x64x8_16x32x1_4x4_4x8_1x2 using 
WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -529,9 +529,9 @@ static void BM_SM50_device_minimum_plus_ssrgemm_nt_t_16x128x8_16x64x1_4x8_4x8_1x using WarpShape = cutlass::gemm::GemmShape<16, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -579,9 +579,9 @@ static void BM_SM50_device_minimum_plus_ssrgemm_nt_t_32x32x8_32x16x1_4x4_8x4_1x2 using WarpShape = cutlass::gemm::GemmShape<32, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -629,9 +629,9 @@ static void BM_SM50_device_minimum_plus_ssrgemm_nt_t_32x64x8_32x32x1_8x4_4x8_1x2 using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = 
cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -679,9 +679,9 @@ static void BM_SM50_device_minimum_plus_ssrgemm_nt_t_32x128x8_32x64x1_8x8_4x8_1x using WarpShape = cutlass::gemm::GemmShape<32, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -729,9 +729,9 @@ static void BM_SM50_device_minimum_plus_ssrgemm_nt_t_64x64x8_64x32x1_8x8_8x4_1x2 using WarpShape = cutlass::gemm::GemmShape<64, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -779,9 +779,9 @@ static void BM_SM50_device_minimum_plus_ssrgemm_nt_t_32x32x8_16x32x1_4x4_4x8_2x1 using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename 
cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -829,9 +829,9 @@ static void BM_SM50_device_minimum_plus_ssrgemm_nt_t_64x32x8_32x32x1_8x4_4x8_2x1 using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -879,9 +879,9 @@ static void BM_SM50_device_minimum_plus_ssrgemm_nt_t_64x64x8_32x64x1_8x8_4x8_2x1 using WarpShape = cutlass::gemm::GemmShape<32, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -929,9 +929,9 @@ static void BM_SM50_device_minimum_plus_ssrgemm_nt_t_128x32x8_64x32x1_8x8_8x4_2x using WarpShape = cutlass::gemm::GemmShape<64, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, 
precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -979,9 +979,9 @@ static void BM_SM50_device_minimum_plus_ssrgemm_nt_t_16x32x8_8x16x1_2x2_4x8_2x2( using WarpShape = cutlass::gemm::GemmShape<8, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1029,9 +1029,9 @@ static void BM_SM50_device_minimum_plus_ssrgemm_nt_t_16x64x8_8x32x1_2x4_4x8_2x2( using WarpShape = cutlass::gemm::GemmShape<8, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1079,9 +1079,9 @@ static void BM_SM50_device_minimum_plus_ssrgemm_nt_t_32x32x8_16x16x1_4x2_4x8_2x2 using WarpShape = cutlass::gemm::GemmShape<16, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, 
cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1129,9 +1129,9 @@ static void BM_SM50_device_minimum_plus_ssrgemm_nt_t_32x64x8_16x32x1_4x4_4x8_2x2 using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1179,9 +1179,9 @@ static void BM_SM50_device_minimum_plus_ssrgemm_nt_t_32x128x8_16x64x1_4x8_4x8_2x using WarpShape = cutlass::gemm::GemmShape<16, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1229,9 +1229,9 @@ static void BM_SM50_device_minimum_plus_ssrgemm_nt_t_64x32x8_32x16x1_4x4_8x4_2x2 using WarpShape = cutlass::gemm::GemmShape<32, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename 
cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1279,9 +1279,9 @@ static void BM_SM50_device_minimum_plus_ssrgemm_nt_t_64x64x8_32x32x1_8x4_4x8_2x2 using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1329,9 +1329,9 @@ static void BM_SM50_device_minimum_plus_ssrgemm_nt_t_64x128x8_32x64x1_8x8_4x8_2x using WarpShape = cutlass::gemm::GemmShape<32, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1379,9 +1379,9 @@ static void BM_SM50_device_minimum_plus_ssrgemm_nt_t_128x32x8_64x16x1_8x4_8x4_2x using WarpShape = cutlass::gemm::GemmShape<64, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, 
precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1429,9 +1429,9 @@ static void BM_SM50_device_minimum_plus_ssrgemm_nt_t_128x64x8_64x32x1_8x8_8x4_2x using WarpShape = cutlass::gemm::GemmShape<64, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1479,9 +1479,9 @@ static void BM_SM50_device_minimum_plus_ssrgemm_nt_t_16x64x16_8x16x1_2x2_4x8_2x4 using WarpShape = cutlass::gemm::GemmShape<8, 16, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1529,9 +1529,9 @@ static void BM_SM50_device_minimum_plus_ssrgemm_nt_t_16x128x16_8x32x1_2x4_4x8_2x using WarpShape = cutlass::gemm::GemmShape<8, 32, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, 
OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1579,9 +1579,9 @@ static void BM_SM50_device_minimum_plus_ssrgemm_nt_t_32x32x8_16x8x1_2x2_8x4_2x4( using WarpShape = cutlass::gemm::GemmShape<16, 8, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1629,9 +1629,9 @@ static void BM_SM50_device_minimum_plus_ssrgemm_nt_t_32x64x8_16x16x1_4x2_4x8_2x4 using WarpShape = cutlass::gemm::GemmShape<16, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1679,9 +1679,9 @@ static void BM_SM50_device_minimum_plus_ssrgemm_nt_t_32x128x8_16x32x1_4x4_4x8_2x using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = 
Config::MultiplicationOp; @@ -1729,9 +1729,9 @@ static void BM_SM50_device_minimum_plus_ssrgemm_nt_t_32x256x8_16x64x1_4x8_4x8_2x using WarpShape = cutlass::gemm::GemmShape<16, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1779,9 +1779,9 @@ static void BM_SM50_device_minimum_plus_ssrgemm_nt_t_64x64x8_32x16x1_4x4_8x4_2x4 using WarpShape = cutlass::gemm::GemmShape<32, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1829,9 +1829,9 @@ static void BM_SM50_device_minimum_plus_ssrgemm_nt_t_64x128x8_32x32x1_8x4_4x8_2x using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1879,9 +1879,9 @@ static void 
BM_SM50_device_minimum_plus_ssrgemm_nt_t_64x256x8_32x64x1_8x8_4x8_2x using WarpShape = cutlass::gemm::GemmShape<32, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1929,9 +1929,9 @@ static void BM_SM50_device_minimum_plus_ssrgemm_nt_t_128x128x8_64x32x1_8x8_8x4_2 using WarpShape = cutlass::gemm::GemmShape<64, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1979,9 +1979,9 @@ static void BM_SM50_device_minimum_plus_ssrgemm_nt_t_32x32x8_8x16x1_2x2_4x8_4x2( using WarpShape = cutlass::gemm::GemmShape<8, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -2029,9 +2029,9 @@ static void BM_SM50_device_minimum_plus_ssrgemm_nt_t_64x32x8_16x16x1_4x2_4x8_4x2 
using WarpShape = cutlass::gemm::GemmShape<16, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -2079,9 +2079,9 @@ static void BM_SM50_device_minimum_plus_ssrgemm_nt_t_64x64x8_16x32x1_4x4_4x8_4x2 using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -2129,9 +2129,9 @@ static void BM_SM50_device_minimum_plus_ssrgemm_nt_t_128x32x8_32x16x1_4x4_8x4_4x using WarpShape = cutlass::gemm::GemmShape<32, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -2179,9 +2179,9 @@ static void BM_SM50_device_minimum_plus_ssrgemm_nt_t_128x64x8_32x32x1_8x4_4x8_4x using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using 
InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -2229,9 +2229,9 @@ static void BM_SM50_device_minimum_plus_ssrgemm_nt_t_128x128x8_32x64x1_8x8_4x8_4 using WarpShape = cutlass::gemm::GemmShape<32, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -2279,9 +2279,9 @@ static void BM_SM50_device_minimum_plus_ssrgemm_nt_t_256x32x8_64x16x1_8x4_8x4_4x using WarpShape = cutlass::gemm::GemmShape<64, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -2329,9 +2329,9 @@ static void BM_SM50_device_minimum_plus_ssrgemm_nt_t_256x64x8_64x32x1_8x8_8x4_4x using WarpShape = cutlass::gemm::GemmShape<64, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = 
typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -2379,9 +2379,9 @@ static void BM_SM50_device_minimum_plus_ssrgemm_nt_t_32x64x16_8x16x1_2x2_4x8_4x4 using WarpShape = cutlass::gemm::GemmShape<8, 16, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -2429,9 +2429,9 @@ static void BM_SM50_device_minimum_plus_ssrgemm_nt_t_32x128x16_8x32x1_2x4_4x8_4x using WarpShape = cutlass::gemm::GemmShape<8, 32, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -2479,9 +2479,9 @@ static void BM_SM50_device_minimum_plus_ssrgemm_nt_t_64x32x16_16x8x1_2x2_8x4_4x4 using WarpShape = cutlass::gemm::GemmShape<16, 8, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - 
precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -2529,9 +2529,9 @@ static void BM_SM50_device_minimum_plus_ssrgemm_nt_t_64x64x8_16x16x1_4x2_4x8_4x4 using WarpShape = cutlass::gemm::GemmShape<16, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -2579,9 +2579,9 @@ static void BM_SM50_device_minimum_plus_ssrgemm_nt_t_64x128x8_16x32x1_4x4_4x8_4x using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -2629,9 +2629,9 @@ static void BM_SM50_device_minimum_plus_ssrgemm_nt_t_64x256x8_16x64x1_4x8_4x8_4x using WarpShape = cutlass::gemm::GemmShape<16, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - 
cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -2679,9 +2679,9 @@ static void BM_SM50_device_minimum_plus_ssrgemm_nt_t_128x32x16_32x8x1_4x2_8x4_4x using WarpShape = cutlass::gemm::GemmShape<32, 8, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -2729,9 +2729,9 @@ static void BM_SM50_device_minimum_plus_ssrgemm_nt_t_128x64x8_32x16x1_4x4_8x4_4x using WarpShape = cutlass::gemm::GemmShape<32, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -2779,9 +2779,9 @@ static void BM_SM50_device_minimum_plus_ssrgemm_nt_t_128x128x8_32x32x1_8x4_4x8_4 using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename 
cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -2829,9 +2829,9 @@ static void BM_SM50_device_minimum_plus_ssrgemm_nt_t_256x64x8_64x16x1_8x4_8x4_4x using WarpShape = cutlass::gemm::GemmShape<64, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; diff --git a/bench/device/sm50_simt_minimum_plus_ssrgemm_tn_n.cu b/bench/device/sm50_simt_minimum_plus_ssrgemm_tn_n.cu index 9ca0344..1584cfc 100644 --- a/bench/device/sm50_simt_minimum_plus_ssrgemm_tn_n.cu +++ b/bench/device/sm50_simt_minimum_plus_ssrgemm_tn_n.cu @@ -29,9 +29,9 @@ static void BM_SM50_device_minimum_plus_ssrgemm_tn_n_8x32x8_8x32x1_2x4_4x8_1x1(b using WarpShape = cutlass::gemm::GemmShape<8, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -79,9 +79,9 @@ static void BM_SM50_device_minimum_plus_ssrgemm_tn_n_16x32x8_16x32x1_4x4_4x8_1x1 using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = 
typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -129,9 +129,9 @@ static void BM_SM50_device_minimum_plus_ssrgemm_tn_n_16x64x8_16x64x1_4x8_4x8_1x1 using WarpShape = cutlass::gemm::GemmShape<16, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -179,9 +179,9 @@ static void BM_SM50_device_minimum_plus_ssrgemm_tn_n_32x32x8_32x32x1_8x4_4x8_1x1 using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -229,9 +229,9 @@ static void BM_SM50_device_minimum_plus_ssrgemm_tn_n_32x64x8_32x64x1_8x8_4x8_1x1 using WarpShape = cutlass::gemm::GemmShape<32, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, 
precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -279,9 +279,9 @@ static void BM_SM50_device_minimum_plus_ssrgemm_tn_n_64x32x8_64x32x1_8x8_8x4_1x1 using WarpShape = cutlass::gemm::GemmShape<64, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -329,9 +329,9 @@ static void BM_SM50_device_minimum_plus_ssrgemm_tn_n_8x32x8_8x16x1_2x2_4x8_1x2(b using WarpShape = cutlass::gemm::GemmShape<8, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -379,9 +379,9 @@ static void BM_SM50_device_minimum_plus_ssrgemm_tn_n_8x64x8_8x32x1_2x4_4x8_1x2(b using WarpShape = cutlass::gemm::GemmShape<8, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, 
SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -429,9 +429,9 @@ static void BM_SM50_device_minimum_plus_ssrgemm_tn_n_16x32x8_16x16x1_4x2_4x8_1x2 using WarpShape = cutlass::gemm::GemmShape<16, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -479,9 +479,9 @@ static void BM_SM50_device_minimum_plus_ssrgemm_tn_n_16x64x8_16x32x1_4x4_4x8_1x2 using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -529,9 +529,9 @@ static void BM_SM50_device_minimum_plus_ssrgemm_tn_n_16x128x8_16x64x1_4x8_4x8_1x using WarpShape = cutlass::gemm::GemmShape<16, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename 
cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -579,9 +579,9 @@ static void BM_SM50_device_minimum_plus_ssrgemm_tn_n_32x32x8_32x16x1_4x4_8x4_1x2 using WarpShape = cutlass::gemm::GemmShape<32, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -629,9 +629,9 @@ static void BM_SM50_device_minimum_plus_ssrgemm_tn_n_32x64x8_32x32x1_8x4_4x8_1x2 using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -679,9 +679,9 @@ static void BM_SM50_device_minimum_plus_ssrgemm_tn_n_32x128x8_32x64x1_8x8_4x8_1x using WarpShape = cutlass::gemm::GemmShape<32, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, 
precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -729,9 +729,9 @@ static void BM_SM50_device_minimum_plus_ssrgemm_tn_n_64x64x8_64x32x1_8x8_8x4_1x2 using WarpShape = cutlass::gemm::GemmShape<64, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -779,9 +779,9 @@ static void BM_SM50_device_minimum_plus_ssrgemm_tn_n_32x32x8_16x32x1_4x4_4x8_2x1 using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -829,9 +829,9 @@ static void BM_SM50_device_minimum_plus_ssrgemm_tn_n_64x32x8_32x32x1_8x4_4x8_2x1 using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using 
AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -879,9 +879,9 @@ static void BM_SM50_device_minimum_plus_ssrgemm_tn_n_64x64x8_32x64x1_8x8_4x8_2x1 using WarpShape = cutlass::gemm::GemmShape<32, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -929,9 +929,9 @@ static void BM_SM50_device_minimum_plus_ssrgemm_tn_n_128x32x8_64x32x1_8x8_8x4_2x using WarpShape = cutlass::gemm::GemmShape<64, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -979,9 +979,9 @@ static void BM_SM50_device_minimum_plus_ssrgemm_tn_n_16x32x8_8x16x1_2x2_4x8_2x2( using WarpShape = cutlass::gemm::GemmShape<8, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ 
-1029,9 +1029,9 @@ static void BM_SM50_device_minimum_plus_ssrgemm_tn_n_16x64x8_8x32x1_2x4_4x8_2x2( using WarpShape = cutlass::gemm::GemmShape<8, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1079,9 +1079,9 @@ static void BM_SM50_device_minimum_plus_ssrgemm_tn_n_32x32x8_16x16x1_4x2_4x8_2x2 using WarpShape = cutlass::gemm::GemmShape<16, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1129,9 +1129,9 @@ static void BM_SM50_device_minimum_plus_ssrgemm_tn_n_32x64x8_16x32x1_4x4_4x8_2x2 using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1179,9 +1179,9 @@ static void 
BM_SM50_device_minimum_plus_ssrgemm_tn_n_32x128x8_16x64x1_4x8_4x8_2x using WarpShape = cutlass::gemm::GemmShape<16, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1229,9 +1229,9 @@ static void BM_SM50_device_minimum_plus_ssrgemm_tn_n_64x32x8_32x16x1_4x4_8x4_2x2 using WarpShape = cutlass::gemm::GemmShape<32, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1279,9 +1279,9 @@ static void BM_SM50_device_minimum_plus_ssrgemm_tn_n_64x64x8_32x32x1_8x4_4x8_2x2 using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1329,9 +1329,9 @@ static void BM_SM50_device_minimum_plus_ssrgemm_tn_n_64x128x8_32x64x1_8x8_4x8_2x 
using WarpShape = cutlass::gemm::GemmShape<32, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1379,9 +1379,9 @@ static void BM_SM50_device_minimum_plus_ssrgemm_tn_n_128x32x8_64x16x1_8x4_8x4_2x using WarpShape = cutlass::gemm::GemmShape<64, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1429,9 +1429,9 @@ static void BM_SM50_device_minimum_plus_ssrgemm_tn_n_128x64x8_64x32x1_8x8_8x4_2x using WarpShape = cutlass::gemm::GemmShape<64, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1479,9 +1479,9 @@ static void BM_SM50_device_minimum_plus_ssrgemm_tn_n_16x64x16_8x16x1_2x2_4x8_2x4 using WarpShape = cutlass::gemm::GemmShape<8, 16, 16>; using 
InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1529,9 +1529,9 @@ static void BM_SM50_device_minimum_plus_ssrgemm_tn_n_16x128x16_8x32x1_2x4_4x8_2x using WarpShape = cutlass::gemm::GemmShape<8, 32, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1579,9 +1579,9 @@ static void BM_SM50_device_minimum_plus_ssrgemm_tn_n_32x32x8_16x8x1_2x2_8x4_2x4( using WarpShape = cutlass::gemm::GemmShape<16, 8, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1629,9 +1629,9 @@ static void BM_SM50_device_minimum_plus_ssrgemm_tn_n_32x64x8_16x16x1_4x2_4x8_2x4 using WarpShape = cutlass::gemm::GemmShape<16, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = 
typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1679,9 +1679,9 @@ static void BM_SM50_device_minimum_plus_ssrgemm_tn_n_32x128x8_16x32x1_4x4_4x8_2x using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1729,9 +1729,9 @@ static void BM_SM50_device_minimum_plus_ssrgemm_tn_n_32x256x8_16x64x1_4x8_4x8_2x using WarpShape = cutlass::gemm::GemmShape<16, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1779,9 +1779,9 @@ static void BM_SM50_device_minimum_plus_ssrgemm_tn_n_64x64x8_32x16x1_4x4_8x4_2x4 using WarpShape = cutlass::gemm::GemmShape<32, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - 
precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1829,9 +1829,9 @@ static void BM_SM50_device_minimum_plus_ssrgemm_tn_n_64x128x8_32x32x1_8x4_4x8_2x using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1879,9 +1879,9 @@ static void BM_SM50_device_minimum_plus_ssrgemm_tn_n_64x256x8_32x64x1_8x8_4x8_2x using WarpShape = cutlass::gemm::GemmShape<32, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1929,9 +1929,9 @@ static void BM_SM50_device_minimum_plus_ssrgemm_tn_n_128x128x8_64x32x1_8x8_8x4_2 using WarpShape = cutlass::gemm::GemmShape<64, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - 
cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1979,9 +1979,9 @@ static void BM_SM50_device_minimum_plus_ssrgemm_tn_n_32x32x8_8x16x1_2x2_4x8_4x2( using WarpShape = cutlass::gemm::GemmShape<8, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -2029,9 +2029,9 @@ static void BM_SM50_device_minimum_plus_ssrgemm_tn_n_64x32x8_16x16x1_4x2_4x8_4x2 using WarpShape = cutlass::gemm::GemmShape<16, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -2079,9 +2079,9 @@ static void BM_SM50_device_minimum_plus_ssrgemm_tn_n_64x64x8_16x32x1_4x4_4x8_4x2 using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename 
cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -2129,9 +2129,9 @@ static void BM_SM50_device_minimum_plus_ssrgemm_tn_n_128x32x8_32x16x1_4x4_8x4_4x using WarpShape = cutlass::gemm::GemmShape<32, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -2179,9 +2179,9 @@ static void BM_SM50_device_minimum_plus_ssrgemm_tn_n_128x64x8_32x32x1_8x4_4x8_4x using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -2229,9 +2229,9 @@ static void BM_SM50_device_minimum_plus_ssrgemm_tn_n_128x128x8_32x64x1_8x8_4x8_4 using WarpShape = cutlass::gemm::GemmShape<32, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, 
precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -2279,9 +2279,9 @@ static void BM_SM50_device_minimum_plus_ssrgemm_tn_n_256x32x8_64x16x1_8x4_8x4_4x using WarpShape = cutlass::gemm::GemmShape<64, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -2329,9 +2329,9 @@ static void BM_SM50_device_minimum_plus_ssrgemm_tn_n_256x64x8_64x32x1_8x8_8x4_4x using WarpShape = cutlass::gemm::GemmShape<64, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -2379,9 +2379,9 @@ static void BM_SM50_device_minimum_plus_ssrgemm_tn_n_32x64x16_8x16x1_2x2_4x8_4x4 using WarpShape = cutlass::gemm::GemmShape<8, 16, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, 
OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -2429,9 +2429,9 @@ static void BM_SM50_device_minimum_plus_ssrgemm_tn_n_32x128x16_8x32x1_2x4_4x8_4x using WarpShape = cutlass::gemm::GemmShape<8, 32, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -2479,9 +2479,9 @@ static void BM_SM50_device_minimum_plus_ssrgemm_tn_n_64x32x16_16x8x1_2x2_8x4_4x4 using WarpShape = cutlass::gemm::GemmShape<16, 8, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -2529,9 +2529,9 @@ static void BM_SM50_device_minimum_plus_ssrgemm_tn_n_64x64x8_16x16x1_4x2_4x8_4x4 using WarpShape = cutlass::gemm::GemmShape<16, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = 
Config::MultiplicationOp; @@ -2579,9 +2579,9 @@ static void BM_SM50_device_minimum_plus_ssrgemm_tn_n_64x128x8_16x32x1_4x4_4x8_4x using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -2629,9 +2629,9 @@ static void BM_SM50_device_minimum_plus_ssrgemm_tn_n_64x256x8_16x64x1_4x8_4x8_4x using WarpShape = cutlass::gemm::GemmShape<16, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -2679,9 +2679,9 @@ static void BM_SM50_device_minimum_plus_ssrgemm_tn_n_128x32x16_32x8x1_4x2_8x4_4x using WarpShape = cutlass::gemm::GemmShape<32, 8, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -2729,9 +2729,9 @@ static void 
BM_SM50_device_minimum_plus_ssrgemm_tn_n_128x64x8_32x16x1_4x4_8x4_4x using WarpShape = cutlass::gemm::GemmShape<32, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -2779,9 +2779,9 @@ static void BM_SM50_device_minimum_plus_ssrgemm_tn_n_128x128x8_32x32x1_8x4_4x8_4 using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -2829,9 +2829,9 @@ static void BM_SM50_device_minimum_plus_ssrgemm_tn_n_256x64x8_64x16x1_8x4_8x4_4x using WarpShape = cutlass::gemm::GemmShape<64, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; diff --git a/bench/device/sm50_simt_minimum_plus_ssrgemm_tn_t.cu 
b/bench/device/sm50_simt_minimum_plus_ssrgemm_tn_t.cu index a8481af..f14d74b 100644 --- a/bench/device/sm50_simt_minimum_plus_ssrgemm_tn_t.cu +++ b/bench/device/sm50_simt_minimum_plus_ssrgemm_tn_t.cu @@ -29,9 +29,9 @@ static void BM_SM50_device_minimum_plus_ssrgemm_tn_t_8x32x8_8x32x1_2x4_4x8_1x1(b using WarpShape = cutlass::gemm::GemmShape<8, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -79,9 +79,9 @@ static void BM_SM50_device_minimum_plus_ssrgemm_tn_t_16x32x8_16x32x1_4x4_4x8_1x1 using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -129,9 +129,9 @@ static void BM_SM50_device_minimum_plus_ssrgemm_tn_t_16x64x8_16x64x1_4x8_4x8_1x1 using WarpShape = cutlass::gemm::GemmShape<16, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + 
cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -179,9 +179,9 @@ static void BM_SM50_device_minimum_plus_ssrgemm_tn_t_32x32x8_32x32x1_8x4_4x8_1x1 using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -229,9 +229,9 @@ static void BM_SM50_device_minimum_plus_ssrgemm_tn_t_32x64x8_32x64x1_8x8_4x8_1x1 using WarpShape = cutlass::gemm::GemmShape<32, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -279,9 +279,9 @@ static void BM_SM50_device_minimum_plus_ssrgemm_tn_t_64x32x8_64x32x1_8x8_8x4_1x1 using WarpShape = cutlass::gemm::GemmShape<64, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = 
Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -329,9 +329,9 @@ static void BM_SM50_device_minimum_plus_ssrgemm_tn_t_8x32x8_8x16x1_2x2_4x8_1x2(b using WarpShape = cutlass::gemm::GemmShape<8, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -379,9 +379,9 @@ static void BM_SM50_device_minimum_plus_ssrgemm_tn_t_8x64x8_8x32x1_2x4_4x8_1x2(b using WarpShape = cutlass::gemm::GemmShape<8, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -429,9 +429,9 @@ static void BM_SM50_device_minimum_plus_ssrgemm_tn_t_16x32x8_16x16x1_4x2_4x8_1x2 using WarpShape = cutlass::gemm::GemmShape<16, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -479,9 +479,9 
@@ static void BM_SM50_device_minimum_plus_ssrgemm_tn_t_16x64x8_16x32x1_4x4_4x8_1x2 using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -529,9 +529,9 @@ static void BM_SM50_device_minimum_plus_ssrgemm_tn_t_16x128x8_16x64x1_4x8_4x8_1x using WarpShape = cutlass::gemm::GemmShape<16, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -579,9 +579,9 @@ static void BM_SM50_device_minimum_plus_ssrgemm_tn_t_32x32x8_32x16x1_4x4_8x4_1x2 using WarpShape = cutlass::gemm::GemmShape<32, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -629,9 +629,9 @@ static void 
BM_SM50_device_minimum_plus_ssrgemm_tn_t_32x64x8_32x32x1_8x4_4x8_1x2 using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -679,9 +679,9 @@ static void BM_SM50_device_minimum_plus_ssrgemm_tn_t_32x128x8_32x64x1_8x8_4x8_1x using WarpShape = cutlass::gemm::GemmShape<32, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -729,9 +729,9 @@ static void BM_SM50_device_minimum_plus_ssrgemm_tn_t_64x64x8_64x32x1_8x8_8x4_1x2 using WarpShape = cutlass::gemm::GemmShape<64, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -779,9 +779,9 @@ static void BM_SM50_device_minimum_plus_ssrgemm_tn_t_32x32x8_16x32x1_4x4_4x8_2x1 using 
WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -829,9 +829,9 @@ static void BM_SM50_device_minimum_plus_ssrgemm_tn_t_64x32x8_32x32x1_8x4_4x8_2x1 using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -879,9 +879,9 @@ static void BM_SM50_device_minimum_plus_ssrgemm_tn_t_64x64x8_32x64x1_8x8_4x8_2x1 using WarpShape = cutlass::gemm::GemmShape<32, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -929,9 +929,9 @@ static void BM_SM50_device_minimum_plus_ssrgemm_tn_t_128x32x8_64x32x1_8x8_8x4_2x using WarpShape = cutlass::gemm::GemmShape<64, 32, 8>; using InstructionShape = 
cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -979,9 +979,9 @@ static void BM_SM50_device_minimum_plus_ssrgemm_tn_t_16x32x8_8x16x1_2x2_4x8_2x2( using WarpShape = cutlass::gemm::GemmShape<8, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1029,9 +1029,9 @@ static void BM_SM50_device_minimum_plus_ssrgemm_tn_t_16x64x8_8x32x1_2x4_4x8_2x2( using WarpShape = cutlass::gemm::GemmShape<8, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1079,9 +1079,9 @@ static void BM_SM50_device_minimum_plus_ssrgemm_tn_t_32x32x8_16x16x1_4x2_4x8_2x2 using WarpShape = cutlass::gemm::GemmShape<16, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename 
cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1129,9 +1129,9 @@ static void BM_SM50_device_minimum_plus_ssrgemm_tn_t_32x64x8_16x32x1_4x4_4x8_2x2 using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1179,9 +1179,9 @@ static void BM_SM50_device_minimum_plus_ssrgemm_tn_t_32x128x8_16x64x1_4x8_4x8_2x using WarpShape = cutlass::gemm::GemmShape<16, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1229,9 +1229,9 @@ static void BM_SM50_device_minimum_plus_ssrgemm_tn_t_64x32x8_32x16x1_4x4_8x4_2x2 using WarpShape = cutlass::gemm::GemmShape<32, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, 
precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1279,9 +1279,9 @@ static void BM_SM50_device_minimum_plus_ssrgemm_tn_t_64x64x8_32x32x1_8x4_4x8_2x2 using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1329,9 +1329,9 @@ static void BM_SM50_device_minimum_plus_ssrgemm_tn_t_64x128x8_32x64x1_8x8_4x8_2x using WarpShape = cutlass::gemm::GemmShape<32, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1379,9 +1379,9 @@ static void BM_SM50_device_minimum_plus_ssrgemm_tn_t_128x32x8_64x16x1_8x4_8x4_2x using WarpShape = cutlass::gemm::GemmShape<64, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, 
cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1429,9 +1429,9 @@ static void BM_SM50_device_minimum_plus_ssrgemm_tn_t_128x64x8_64x32x1_8x8_8x4_2x using WarpShape = cutlass::gemm::GemmShape<64, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1479,9 +1479,9 @@ static void BM_SM50_device_minimum_plus_ssrgemm_tn_t_16x64x16_8x16x1_2x2_4x8_2x4 using WarpShape = cutlass::gemm::GemmShape<8, 16, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1529,9 +1529,9 @@ static void BM_SM50_device_minimum_plus_ssrgemm_tn_t_16x128x16_8x32x1_2x4_4x8_2x using WarpShape = cutlass::gemm::GemmShape<8, 32, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename 
cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1579,9 +1579,9 @@ static void BM_SM50_device_minimum_plus_ssrgemm_tn_t_32x32x8_16x8x1_2x2_8x4_2x4( using WarpShape = cutlass::gemm::GemmShape<16, 8, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1629,9 +1629,9 @@ static void BM_SM50_device_minimum_plus_ssrgemm_tn_t_32x64x8_16x16x1_4x2_4x8_2x4 using WarpShape = cutlass::gemm::GemmShape<16, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1679,9 +1679,9 @@ static void BM_SM50_device_minimum_plus_ssrgemm_tn_t_32x128x8_16x32x1_4x4_4x8_2x using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, 
precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1729,9 +1729,9 @@ static void BM_SM50_device_minimum_plus_ssrgemm_tn_t_32x256x8_16x64x1_4x8_4x8_2x using WarpShape = cutlass::gemm::GemmShape<16, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1779,9 +1779,9 @@ static void BM_SM50_device_minimum_plus_ssrgemm_tn_t_64x64x8_32x16x1_4x4_8x4_2x4 using WarpShape = cutlass::gemm::GemmShape<32, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1829,9 +1829,9 @@ static void BM_SM50_device_minimum_plus_ssrgemm_tn_t_64x128x8_32x32x1_8x4_4x8_2x using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, 
OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1879,9 +1879,9 @@ static void BM_SM50_device_minimum_plus_ssrgemm_tn_t_64x256x8_32x64x1_8x8_4x8_2x using WarpShape = cutlass::gemm::GemmShape<32, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1929,9 +1929,9 @@ static void BM_SM50_device_minimum_plus_ssrgemm_tn_t_128x128x8_64x32x1_8x8_8x4_2 using WarpShape = cutlass::gemm::GemmShape<64, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1979,9 +1979,9 @@ static void BM_SM50_device_minimum_plus_ssrgemm_tn_t_32x32x8_8x16x1_2x2_4x8_4x2( using WarpShape = cutlass::gemm::GemmShape<8, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = 
Config::MultiplicationOp; @@ -2029,9 +2029,9 @@ static void BM_SM50_device_minimum_plus_ssrgemm_tn_t_64x32x8_16x16x1_4x2_4x8_4x2 using WarpShape = cutlass::gemm::GemmShape<16, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -2079,9 +2079,9 @@ static void BM_SM50_device_minimum_plus_ssrgemm_tn_t_64x64x8_16x32x1_4x4_4x8_4x2 using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -2129,9 +2129,9 @@ static void BM_SM50_device_minimum_plus_ssrgemm_tn_t_128x32x8_32x16x1_4x4_8x4_4x using WarpShape = cutlass::gemm::GemmShape<32, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -2179,9 +2179,9 @@ static void 
BM_SM50_device_minimum_plus_ssrgemm_tn_t_128x64x8_32x32x1_8x4_4x8_4x using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -2229,9 +2229,9 @@ static void BM_SM50_device_minimum_plus_ssrgemm_tn_t_128x128x8_32x64x1_8x8_4x8_4 using WarpShape = cutlass::gemm::GemmShape<32, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -2279,9 +2279,9 @@ static void BM_SM50_device_minimum_plus_ssrgemm_tn_t_256x32x8_64x16x1_8x4_8x4_4x using WarpShape = cutlass::gemm::GemmShape<64, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -2329,9 +2329,9 @@ static void BM_SM50_device_minimum_plus_ssrgemm_tn_t_256x64x8_64x32x1_8x8_8x4_4x 
using WarpShape = cutlass::gemm::GemmShape<64, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -2379,9 +2379,9 @@ static void BM_SM50_device_minimum_plus_ssrgemm_tn_t_32x64x16_8x16x1_2x2_4x8_4x4 using WarpShape = cutlass::gemm::GemmShape<8, 16, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -2429,9 +2429,9 @@ static void BM_SM50_device_minimum_plus_ssrgemm_tn_t_32x128x16_8x32x1_2x4_4x8_4x using WarpShape = cutlass::gemm::GemmShape<8, 32, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -2479,9 +2479,9 @@ static void BM_SM50_device_minimum_plus_ssrgemm_tn_t_64x32x16_16x8x1_2x2_8x4_4x4 using WarpShape = cutlass::gemm::GemmShape<16, 8, 16>; using 
InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -2529,9 +2529,9 @@ static void BM_SM50_device_minimum_plus_ssrgemm_tn_t_64x64x8_16x16x1_4x2_4x8_4x4 using WarpShape = cutlass::gemm::GemmShape<16, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -2579,9 +2579,9 @@ static void BM_SM50_device_minimum_plus_ssrgemm_tn_t_64x128x8_16x32x1_4x4_4x8_4x using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -2629,9 +2629,9 @@ static void BM_SM50_device_minimum_plus_ssrgemm_tn_t_64x256x8_16x64x1_4x8_4x8_4x using WarpShape = cutlass::gemm::GemmShape<16, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = 
typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -2679,9 +2679,9 @@ static void BM_SM50_device_minimum_plus_ssrgemm_tn_t_128x32x16_32x8x1_4x2_8x4_4x using WarpShape = cutlass::gemm::GemmShape<32, 8, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -2729,9 +2729,9 @@ static void BM_SM50_device_minimum_plus_ssrgemm_tn_t_128x64x8_32x16x1_4x4_8x4_4x using WarpShape = cutlass::gemm::GemmShape<32, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -2779,9 +2779,9 @@ static void BM_SM50_device_minimum_plus_ssrgemm_tn_t_128x128x8_32x32x1_8x4_4x8_4 using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - 
precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -2829,9 +2829,9 @@ static void BM_SM50_device_minimum_plus_ssrgemm_tn_t_256x64x8_64x16x1_8x4_8x4_4x using WarpShape = cutlass::gemm::GemmShape<64, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; diff --git a/bench/device/sm50_simt_minimum_plus_ssrgemm_tt_n.cu b/bench/device/sm50_simt_minimum_plus_ssrgemm_tt_n.cu index 15e1bc6..01ee21e 100644 --- a/bench/device/sm50_simt_minimum_plus_ssrgemm_tt_n.cu +++ b/bench/device/sm50_simt_minimum_plus_ssrgemm_tt_n.cu @@ -29,9 +29,9 @@ static void BM_SM50_device_minimum_plus_ssrgemm_tt_n_8x32x8_8x32x1_2x4_4x8_1x1(b using WarpShape = cutlass::gemm::GemmShape<8, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -79,9 +79,9 @@ static void BM_SM50_device_minimum_plus_ssrgemm_tt_n_16x32x8_16x32x1_4x4_4x8_1x1 using 
WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -129,9 +129,9 @@ static void BM_SM50_device_minimum_plus_ssrgemm_tt_n_16x64x8_16x64x1_4x8_4x8_1x1 using WarpShape = cutlass::gemm::GemmShape<16, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -179,9 +179,9 @@ static void BM_SM50_device_minimum_plus_ssrgemm_tt_n_32x32x8_32x32x1_8x4_4x8_1x1 using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -229,9 +229,9 @@ static void BM_SM50_device_minimum_plus_ssrgemm_tt_n_32x64x8_32x64x1_8x8_4x8_1x1 using WarpShape = cutlass::gemm::GemmShape<32, 64, 8>; using InstructionShape = 
cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -279,9 +279,9 @@ static void BM_SM50_device_minimum_plus_ssrgemm_tt_n_64x32x8_64x32x1_8x8_8x4_1x1 using WarpShape = cutlass::gemm::GemmShape<64, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -329,9 +329,9 @@ static void BM_SM50_device_minimum_plus_ssrgemm_tt_n_8x32x8_8x16x1_2x2_4x8_1x2(b using WarpShape = cutlass::gemm::GemmShape<8, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -379,9 +379,9 @@ static void BM_SM50_device_minimum_plus_ssrgemm_tt_n_8x64x8_8x32x1_2x4_4x8_1x2(b using WarpShape = cutlass::gemm::GemmShape<8, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename 
cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -429,9 +429,9 @@ static void BM_SM50_device_minimum_plus_ssrgemm_tt_n_16x32x8_16x16x1_4x2_4x8_1x2 using WarpShape = cutlass::gemm::GemmShape<16, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -479,9 +479,9 @@ static void BM_SM50_device_minimum_plus_ssrgemm_tt_n_16x64x8_16x32x1_4x4_4x8_1x2 using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -529,9 +529,9 @@ static void BM_SM50_device_minimum_plus_ssrgemm_tt_n_16x128x8_16x64x1_4x8_4x8_1x using WarpShape = cutlass::gemm::GemmShape<16, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, 
precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -579,9 +579,9 @@ static void BM_SM50_device_minimum_plus_ssrgemm_tt_n_32x32x8_32x16x1_4x4_8x4_1x2 using WarpShape = cutlass::gemm::GemmShape<32, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -629,9 +629,9 @@ static void BM_SM50_device_minimum_plus_ssrgemm_tt_n_32x64x8_32x32x1_8x4_4x8_1x2 using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -679,9 +679,9 @@ static void BM_SM50_device_minimum_plus_ssrgemm_tt_n_32x128x8_32x64x1_8x8_4x8_1x using WarpShape = cutlass::gemm::GemmShape<32, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, 
SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -729,9 +729,9 @@ static void BM_SM50_device_minimum_plus_ssrgemm_tt_n_64x64x8_64x32x1_8x8_8x4_1x2 using WarpShape = cutlass::gemm::GemmShape<64, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -779,9 +779,9 @@ static void BM_SM50_device_minimum_plus_ssrgemm_tt_n_32x32x8_16x32x1_4x4_4x8_2x1 using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -829,9 +829,9 @@ static void BM_SM50_device_minimum_plus_ssrgemm_tt_n_64x32x8_32x32x1_8x4_4x8_2x1 using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename 
cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -879,9 +879,9 @@ static void BM_SM50_device_minimum_plus_ssrgemm_tt_n_64x64x8_32x64x1_8x8_4x8_2x1 using WarpShape = cutlass::gemm::GemmShape<32, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -929,9 +929,9 @@ static void BM_SM50_device_minimum_plus_ssrgemm_tt_n_128x32x8_64x32x1_8x8_8x4_2x using WarpShape = cutlass::gemm::GemmShape<64, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -979,9 +979,9 @@ static void BM_SM50_device_minimum_plus_ssrgemm_tt_n_16x32x8_8x16x1_2x2_4x8_2x2( using WarpShape = cutlass::gemm::GemmShape<8, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, 
precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1029,9 +1029,9 @@ static void BM_SM50_device_minimum_plus_ssrgemm_tt_n_16x64x8_8x32x1_2x4_4x8_2x2( using WarpShape = cutlass::gemm::GemmShape<8, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1079,9 +1079,9 @@ static void BM_SM50_device_minimum_plus_ssrgemm_tt_n_32x32x8_16x16x1_4x2_4x8_2x2 using WarpShape = cutlass::gemm::GemmShape<16, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1129,9 +1129,9 @@ static void BM_SM50_device_minimum_plus_ssrgemm_tt_n_32x64x8_16x32x1_4x4_4x8_2x2 using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; 
using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1179,9 +1179,9 @@ static void BM_SM50_device_minimum_plus_ssrgemm_tt_n_32x128x8_16x64x1_4x8_4x8_2x using WarpShape = cutlass::gemm::GemmShape<16, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1229,9 +1229,9 @@ static void BM_SM50_device_minimum_plus_ssrgemm_tt_n_64x32x8_32x16x1_4x4_8x4_2x2 using WarpShape = cutlass::gemm::GemmShape<32, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1279,9 +1279,9 @@ static void BM_SM50_device_minimum_plus_ssrgemm_tt_n_64x64x8_32x32x1_8x4_4x8_2x2 using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = 
Config::MultiplicationOp; @@ -1329,9 +1329,9 @@ static void BM_SM50_device_minimum_plus_ssrgemm_tt_n_64x128x8_32x64x1_8x8_4x8_2x using WarpShape = cutlass::gemm::GemmShape<32, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1379,9 +1379,9 @@ static void BM_SM50_device_minimum_plus_ssrgemm_tt_n_128x32x8_64x16x1_8x4_8x4_2x using WarpShape = cutlass::gemm::GemmShape<64, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1429,9 +1429,9 @@ static void BM_SM50_device_minimum_plus_ssrgemm_tt_n_128x64x8_64x32x1_8x8_8x4_2x using WarpShape = cutlass::gemm::GemmShape<64, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1479,9 +1479,9 @@ static void 
BM_SM50_device_minimum_plus_ssrgemm_tt_n_16x64x16_8x16x1_2x2_4x8_2x4 using WarpShape = cutlass::gemm::GemmShape<8, 16, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1529,9 +1529,9 @@ static void BM_SM50_device_minimum_plus_ssrgemm_tt_n_16x128x16_8x32x1_2x4_4x8_2x using WarpShape = cutlass::gemm::GemmShape<8, 32, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1579,9 +1579,9 @@ static void BM_SM50_device_minimum_plus_ssrgemm_tt_n_32x32x8_16x8x1_2x2_8x4_2x4( using WarpShape = cutlass::gemm::GemmShape<16, 8, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1629,9 +1629,9 @@ static void BM_SM50_device_minimum_plus_ssrgemm_tt_n_32x64x8_16x16x1_4x2_4x8_2x4 
using WarpShape = cutlass::gemm::GemmShape<16, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1679,9 +1679,9 @@ static void BM_SM50_device_minimum_plus_ssrgemm_tt_n_32x128x8_16x32x1_4x4_4x8_2x using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1729,9 +1729,9 @@ static void BM_SM50_device_minimum_plus_ssrgemm_tt_n_32x256x8_16x64x1_4x8_4x8_2x using WarpShape = cutlass::gemm::GemmShape<16, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1779,9 +1779,9 @@ static void BM_SM50_device_minimum_plus_ssrgemm_tt_n_64x64x8_32x16x1_4x4_8x4_2x4 using WarpShape = cutlass::gemm::GemmShape<32, 16, 8>; using 
InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1829,9 +1829,9 @@ static void BM_SM50_device_minimum_plus_ssrgemm_tt_n_64x128x8_32x32x1_8x4_4x8_2x using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1879,9 +1879,9 @@ static void BM_SM50_device_minimum_plus_ssrgemm_tt_n_64x256x8_32x64x1_8x8_4x8_2x using WarpShape = cutlass::gemm::GemmShape<32, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1929,9 +1929,9 @@ static void BM_SM50_device_minimum_plus_ssrgemm_tt_n_128x128x8_64x32x1_8x8_8x4_2 using WarpShape = cutlass::gemm::GemmShape<64, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = 
typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1979,9 +1979,9 @@ static void BM_SM50_device_minimum_plus_ssrgemm_tt_n_32x32x8_8x16x1_2x2_4x8_4x2( using WarpShape = cutlass::gemm::GemmShape<8, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -2029,9 +2029,9 @@ static void BM_SM50_device_minimum_plus_ssrgemm_tt_n_64x32x8_16x16x1_4x2_4x8_4x2 using WarpShape = cutlass::gemm::GemmShape<16, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -2079,9 +2079,9 @@ static void BM_SM50_device_minimum_plus_ssrgemm_tt_n_64x64x8_16x32x1_4x4_4x8_4x2 using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - 
precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -2129,9 +2129,9 @@ static void BM_SM50_device_minimum_plus_ssrgemm_tt_n_128x32x8_32x16x1_4x4_8x4_4x using WarpShape = cutlass::gemm::GemmShape<32, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -2179,9 +2179,9 @@ static void BM_SM50_device_minimum_plus_ssrgemm_tt_n_128x64x8_32x32x1_8x4_4x8_4x using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -2229,9 +2229,9 @@ static void BM_SM50_device_minimum_plus_ssrgemm_tt_n_128x128x8_32x64x1_8x8_4x8_4 using WarpShape = cutlass::gemm::GemmShape<32, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - 
cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -2279,9 +2279,9 @@ static void BM_SM50_device_minimum_plus_ssrgemm_tt_n_256x32x8_64x16x1_8x4_8x4_4x using WarpShape = cutlass::gemm::GemmShape<64, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -2329,9 +2329,9 @@ static void BM_SM50_device_minimum_plus_ssrgemm_tt_n_256x64x8_64x32x1_8x8_8x4_4x using WarpShape = cutlass::gemm::GemmShape<64, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -2379,9 +2379,9 @@ static void BM_SM50_device_minimum_plus_ssrgemm_tt_n_32x64x16_8x16x1_2x2_4x8_4x4 using WarpShape = cutlass::gemm::GemmShape<8, 16, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename 
cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -2429,9 +2429,9 @@ static void BM_SM50_device_minimum_plus_ssrgemm_tt_n_32x128x16_8x32x1_2x4_4x8_4x using WarpShape = cutlass::gemm::GemmShape<8, 32, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -2479,9 +2479,9 @@ static void BM_SM50_device_minimum_plus_ssrgemm_tt_n_64x32x16_16x8x1_2x2_8x4_4x4 using WarpShape = cutlass::gemm::GemmShape<16, 8, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -2529,9 +2529,9 @@ static void BM_SM50_device_minimum_plus_ssrgemm_tt_n_64x64x8_16x16x1_4x2_4x8_4x4 using WarpShape = cutlass::gemm::GemmShape<16, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, 
precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -2579,9 +2579,9 @@ static void BM_SM50_device_minimum_plus_ssrgemm_tt_n_64x128x8_16x32x1_4x4_4x8_4x using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -2629,9 +2629,9 @@ static void BM_SM50_device_minimum_plus_ssrgemm_tt_n_64x256x8_16x64x1_4x8_4x8_4x using WarpShape = cutlass::gemm::GemmShape<16, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -2679,9 +2679,9 @@ static void BM_SM50_device_minimum_plus_ssrgemm_tt_n_128x32x16_32x8x1_4x2_8x4_4x using WarpShape = cutlass::gemm::GemmShape<32, 8, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, 
OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -2729,9 +2729,9 @@ static void BM_SM50_device_minimum_plus_ssrgemm_tt_n_128x64x8_32x16x1_4x4_8x4_4x using WarpShape = cutlass::gemm::GemmShape<32, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -2779,9 +2779,9 @@ static void BM_SM50_device_minimum_plus_ssrgemm_tt_n_128x128x8_32x32x1_8x4_4x8_4 using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -2829,9 +2829,9 @@ static void BM_SM50_device_minimum_plus_ssrgemm_tt_n_256x64x8_64x16x1_8x4_8x4_4x using WarpShape = cutlass::gemm::GemmShape<64, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = 
Config::MultiplicationOp; diff --git a/bench/device/sm50_simt_minimum_plus_ssrgemm_tt_t.cu b/bench/device/sm50_simt_minimum_plus_ssrgemm_tt_t.cu index bcb72e4..8cb2e95 100644 --- a/bench/device/sm50_simt_minimum_plus_ssrgemm_tt_t.cu +++ b/bench/device/sm50_simt_minimum_plus_ssrgemm_tt_t.cu @@ -29,9 +29,9 @@ static void BM_SM50_device_minimum_plus_ssrgemm_tt_t_8x32x8_8x32x1_2x4_4x8_1x1(b using WarpShape = cutlass::gemm::GemmShape<8, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -79,9 +79,9 @@ static void BM_SM50_device_minimum_plus_ssrgemm_tt_t_16x32x8_16x32x1_4x4_4x8_1x1 using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -129,9 +129,9 @@ static void BM_SM50_device_minimum_plus_ssrgemm_tt_t_16x64x8_16x64x1_4x8_4x8_1x1 using WarpShape = cutlass::gemm::GemmShape<16, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename 
cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -179,9 +179,9 @@ static void BM_SM50_device_minimum_plus_ssrgemm_tt_t_32x32x8_32x32x1_8x4_4x8_1x1 using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -229,9 +229,9 @@ static void BM_SM50_device_minimum_plus_ssrgemm_tt_t_32x64x8_32x64x1_8x8_4x8_1x1 using WarpShape = cutlass::gemm::GemmShape<32, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -279,9 +279,9 @@ static void BM_SM50_device_minimum_plus_ssrgemm_tt_t_64x32x8_64x32x1_8x8_8x4_1x1 using WarpShape = cutlass::gemm::GemmShape<64, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, 
precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -329,9 +329,9 @@ static void BM_SM50_device_minimum_plus_ssrgemm_tt_t_8x32x8_8x16x1_2x2_4x8_1x2(b using WarpShape = cutlass::gemm::GemmShape<8, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -379,9 +379,9 @@ static void BM_SM50_device_minimum_plus_ssrgemm_tt_t_8x64x8_8x32x1_2x4_4x8_1x2(b using WarpShape = cutlass::gemm::GemmShape<8, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -429,9 +429,9 @@ static void BM_SM50_device_minimum_plus_ssrgemm_tt_t_16x32x8_16x16x1_4x2_4x8_1x2 using WarpShape = cutlass::gemm::GemmShape<16, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using 
AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -479,9 +479,9 @@ static void BM_SM50_device_minimum_plus_ssrgemm_tt_t_16x64x8_16x32x1_4x4_4x8_1x2 using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -529,9 +529,9 @@ static void BM_SM50_device_minimum_plus_ssrgemm_tt_t_16x128x8_16x64x1_4x8_4x8_1x using WarpShape = cutlass::gemm::GemmShape<16, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -579,9 +579,9 @@ static void BM_SM50_device_minimum_plus_ssrgemm_tt_t_32x32x8_32x16x1_4x4_8x4_1x2 using WarpShape = cutlass::gemm::GemmShape<32, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ 
-629,9 +629,9 @@ static void BM_SM50_device_minimum_plus_ssrgemm_tt_t_32x64x8_32x32x1_8x4_4x8_1x2 using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -679,9 +679,9 @@ static void BM_SM50_device_minimum_plus_ssrgemm_tt_t_32x128x8_32x64x1_8x8_4x8_1x using WarpShape = cutlass::gemm::GemmShape<32, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -729,9 +729,9 @@ static void BM_SM50_device_minimum_plus_ssrgemm_tt_t_64x64x8_64x32x1_8x8_8x4_1x2 using WarpShape = cutlass::gemm::GemmShape<64, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -779,9 +779,9 @@ static void 
BM_SM50_device_minimum_plus_ssrgemm_tt_t_32x32x8_16x32x1_4x4_4x8_2x1 using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -829,9 +829,9 @@ static void BM_SM50_device_minimum_plus_ssrgemm_tt_t_64x32x8_32x32x1_8x4_4x8_2x1 using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -879,9 +879,9 @@ static void BM_SM50_device_minimum_plus_ssrgemm_tt_t_64x64x8_32x64x1_8x8_4x8_2x1 using WarpShape = cutlass::gemm::GemmShape<32, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -929,9 +929,9 @@ static void BM_SM50_device_minimum_plus_ssrgemm_tt_t_128x32x8_64x32x1_8x8_8x4_2x using 
WarpShape = cutlass::gemm::GemmShape<64, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -979,9 +979,9 @@ static void BM_SM50_device_minimum_plus_ssrgemm_tt_t_16x32x8_8x16x1_2x2_4x8_2x2( using WarpShape = cutlass::gemm::GemmShape<8, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1029,9 +1029,9 @@ static void BM_SM50_device_minimum_plus_ssrgemm_tt_t_16x64x8_8x32x1_2x4_4x8_2x2( using WarpShape = cutlass::gemm::GemmShape<8, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1079,9 +1079,9 @@ static void BM_SM50_device_minimum_plus_ssrgemm_tt_t_32x32x8_16x16x1_4x2_4x8_2x2 using WarpShape = cutlass::gemm::GemmShape<16, 16, 8>; using InstructionShape = 
cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1129,9 +1129,9 @@ static void BM_SM50_device_minimum_plus_ssrgemm_tt_t_32x64x8_16x32x1_4x4_4x8_2x2 using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1179,9 +1179,9 @@ static void BM_SM50_device_minimum_plus_ssrgemm_tt_t_32x128x8_16x64x1_4x8_4x8_2x using WarpShape = cutlass::gemm::GemmShape<16, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1229,9 +1229,9 @@ static void BM_SM50_device_minimum_plus_ssrgemm_tt_t_64x32x8_32x16x1_4x4_8x4_2x2 using WarpShape = cutlass::gemm::GemmShape<32, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename 
cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1279,9 +1279,9 @@ static void BM_SM50_device_minimum_plus_ssrgemm_tt_t_64x64x8_32x32x1_8x4_4x8_2x2 using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1329,9 +1329,9 @@ static void BM_SM50_device_minimum_plus_ssrgemm_tt_t_64x128x8_32x64x1_8x8_4x8_2x using WarpShape = cutlass::gemm::GemmShape<32, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1379,9 +1379,9 @@ static void BM_SM50_device_minimum_plus_ssrgemm_tt_t_128x32x8_64x16x1_8x4_8x4_2x using WarpShape = cutlass::gemm::GemmShape<64, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, 
precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1429,9 +1429,9 @@ static void BM_SM50_device_minimum_plus_ssrgemm_tt_t_128x64x8_64x32x1_8x8_8x4_2x using WarpShape = cutlass::gemm::GemmShape<64, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1479,9 +1479,9 @@ static void BM_SM50_device_minimum_plus_ssrgemm_tt_t_16x64x16_8x16x1_2x2_4x8_2x4 using WarpShape = cutlass::gemm::GemmShape<8, 16, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1529,9 +1529,9 @@ static void BM_SM50_device_minimum_plus_ssrgemm_tt_t_16x128x16_8x32x1_2x4_4x8_2x using WarpShape = cutlass::gemm::GemmShape<8, 32, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, 
cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1579,9 +1579,9 @@ static void BM_SM50_device_minimum_plus_ssrgemm_tt_t_32x32x8_16x8x1_2x2_8x4_2x4( using WarpShape = cutlass::gemm::GemmShape<16, 8, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1629,9 +1629,9 @@ static void BM_SM50_device_minimum_plus_ssrgemm_tt_t_32x64x8_16x16x1_4x2_4x8_2x4 using WarpShape = cutlass::gemm::GemmShape<16, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1679,9 +1679,9 @@ static void BM_SM50_device_minimum_plus_ssrgemm_tt_t_32x128x8_16x32x1_4x4_4x8_2x using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename 
cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1729,9 +1729,9 @@ static void BM_SM50_device_minimum_plus_ssrgemm_tt_t_32x256x8_16x64x1_4x8_4x8_2x using WarpShape = cutlass::gemm::GemmShape<16, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1779,9 +1779,9 @@ static void BM_SM50_device_minimum_plus_ssrgemm_tt_t_64x64x8_32x16x1_4x4_8x4_2x4 using WarpShape = cutlass::gemm::GemmShape<32, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1829,9 +1829,9 @@ static void BM_SM50_device_minimum_plus_ssrgemm_tt_t_64x128x8_32x32x1_8x4_4x8_2x using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, 
precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1879,9 +1879,9 @@ static void BM_SM50_device_minimum_plus_ssrgemm_tt_t_64x256x8_32x64x1_8x8_4x8_2x using WarpShape = cutlass::gemm::GemmShape<32, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1929,9 +1929,9 @@ static void BM_SM50_device_minimum_plus_ssrgemm_tt_t_128x128x8_64x32x1_8x8_8x4_2 using WarpShape = cutlass::gemm::GemmShape<64, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1979,9 +1979,9 @@ static void BM_SM50_device_minimum_plus_ssrgemm_tt_t_32x32x8_8x16x1_2x2_4x8_4x2( using WarpShape = cutlass::gemm::GemmShape<8, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, 
OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -2029,9 +2029,9 @@ static void BM_SM50_device_minimum_plus_ssrgemm_tt_t_64x32x8_16x16x1_4x2_4x8_4x2 using WarpShape = cutlass::gemm::GemmShape<16, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -2079,9 +2079,9 @@ static void BM_SM50_device_minimum_plus_ssrgemm_tt_t_64x64x8_16x32x1_4x4_4x8_4x2 using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -2129,9 +2129,9 @@ static void BM_SM50_device_minimum_plus_ssrgemm_tt_t_128x32x8_32x16x1_4x4_8x4_4x using WarpShape = cutlass::gemm::GemmShape<32, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = 
Config::MultiplicationOp; @@ -2179,9 +2179,9 @@ static void BM_SM50_device_minimum_plus_ssrgemm_tt_t_128x64x8_32x32x1_8x4_4x8_4x using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -2229,9 +2229,9 @@ static void BM_SM50_device_minimum_plus_ssrgemm_tt_t_128x128x8_32x64x1_8x8_4x8_4 using WarpShape = cutlass::gemm::GemmShape<32, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -2279,9 +2279,9 @@ static void BM_SM50_device_minimum_plus_ssrgemm_tt_t_256x32x8_64x16x1_8x4_8x4_4x using WarpShape = cutlass::gemm::GemmShape<64, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -2329,9 +2329,9 @@ static void 
BM_SM50_device_minimum_plus_ssrgemm_tt_t_256x64x8_64x32x1_8x8_8x4_4x using WarpShape = cutlass::gemm::GemmShape<64, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -2379,9 +2379,9 @@ static void BM_SM50_device_minimum_plus_ssrgemm_tt_t_32x64x16_8x16x1_2x2_4x8_4x4 using WarpShape = cutlass::gemm::GemmShape<8, 16, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -2429,9 +2429,9 @@ static void BM_SM50_device_minimum_plus_ssrgemm_tt_t_32x128x16_8x32x1_2x4_4x8_4x using WarpShape = cutlass::gemm::GemmShape<8, 32, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -2479,9 +2479,9 @@ static void BM_SM50_device_minimum_plus_ssrgemm_tt_t_64x32x16_16x8x1_2x2_8x4_4x4 
using WarpShape = cutlass::gemm::GemmShape<16, 8, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -2529,9 +2529,9 @@ static void BM_SM50_device_minimum_plus_ssrgemm_tt_t_64x64x8_16x16x1_4x2_4x8_4x4 using WarpShape = cutlass::gemm::GemmShape<16, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -2579,9 +2579,9 @@ static void BM_SM50_device_minimum_plus_ssrgemm_tt_t_64x128x8_16x32x1_4x4_4x8_4x using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -2629,9 +2629,9 @@ static void BM_SM50_device_minimum_plus_ssrgemm_tt_t_64x256x8_16x64x1_4x8_4x8_4x using WarpShape = cutlass::gemm::GemmShape<16, 64, 8>; using 
InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -2679,9 +2679,9 @@ static void BM_SM50_device_minimum_plus_ssrgemm_tt_t_128x32x16_32x8x1_4x2_8x4_4x using WarpShape = cutlass::gemm::GemmShape<32, 8, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -2729,9 +2729,9 @@ static void BM_SM50_device_minimum_plus_ssrgemm_tt_t_128x64x8_32x16x1_4x4_8x4_4x using WarpShape = cutlass::gemm::GemmShape<32, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -2779,9 +2779,9 @@ static void BM_SM50_device_minimum_plus_ssrgemm_tt_t_128x128x8_32x32x1_8x4_4x8_4 using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = 
typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -2829,9 +2829,9 @@ static void BM_SM50_device_minimum_plus_ssrgemm_tt_t_256x64x8_64x16x1_8x4_8x4_4x using WarpShape = cutlass::gemm::GemmShape<64, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; diff --git a/bench/device/sm50_simt_plus_multiplies_dsrgemm_nn_n.cu b/bench/device/sm50_simt_plus_multiplies_dsrgemm_nn_n.cu index b84e746..6739ecd 100644 --- a/bench/device/sm50_simt_plus_multiplies_dsrgemm_nn_n.cu +++ b/bench/device/sm50_simt_plus_multiplies_dsrgemm_nn_n.cu @@ -29,9 +29,9 @@ static void BM_SM50_device_plus_multiplies_dsrgemm_nn_n_8x32x8_8x32x1_2x4_4x8_1x using WarpShape = cutlass::gemm::GemmShape<8, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -79,9 +79,9 @@ static 
void BM_SM50_device_plus_multiplies_dsrgemm_nn_n_16x32x8_16x32x1_4x4_4x8_ using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -129,9 +129,9 @@ static void BM_SM50_device_plus_multiplies_dsrgemm_nn_n_16x64x8_16x64x1_4x8_4x8_ using WarpShape = cutlass::gemm::GemmShape<16, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -179,9 +179,9 @@ static void BM_SM50_device_plus_multiplies_dsrgemm_nn_n_32x32x8_32x32x1_8x4_4x8_ using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -229,9 +229,9 @@ static void 
BM_SM50_device_plus_multiplies_dsrgemm_nn_n_8x32x8_8x16x1_2x2_4x8_1x using WarpShape = cutlass::gemm::GemmShape<8, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -279,9 +279,9 @@ static void BM_SM50_device_plus_multiplies_dsrgemm_nn_n_8x64x8_8x32x1_2x4_4x8_1x using WarpShape = cutlass::gemm::GemmShape<8, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -329,9 +329,9 @@ static void BM_SM50_device_plus_multiplies_dsrgemm_nn_n_16x32x8_16x16x1_4x2_4x8_ using WarpShape = cutlass::gemm::GemmShape<16, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -379,9 +379,9 @@ static void 
BM_SM50_device_plus_multiplies_dsrgemm_nn_n_16x64x8_16x32x1_4x4_4x8_ using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -429,9 +429,9 @@ static void BM_SM50_device_plus_multiplies_dsrgemm_nn_n_16x128x8_16x64x1_4x8_4x8 using WarpShape = cutlass::gemm::GemmShape<16, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -479,9 +479,9 @@ static void BM_SM50_device_plus_multiplies_dsrgemm_nn_n_32x32x8_32x16x1_4x4_8x4_ using WarpShape = cutlass::gemm::GemmShape<32, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -529,9 +529,9 @@ static void 
BM_SM50_device_plus_multiplies_dsrgemm_nn_n_32x64x8_32x32x1_8x4_4x8_ using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -579,9 +579,9 @@ static void BM_SM50_device_plus_multiplies_dsrgemm_nn_n_32x32x8_16x32x1_4x4_4x8_ using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -629,9 +629,9 @@ static void BM_SM50_device_plus_multiplies_dsrgemm_nn_n_64x32x8_32x32x1_8x4_4x8_ using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -679,9 +679,9 @@ static void 
BM_SM50_device_plus_multiplies_dsrgemm_nn_n_16x32x8_8x16x1_2x2_4x8_2 using WarpShape = cutlass::gemm::GemmShape<8, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -729,9 +729,9 @@ static void BM_SM50_device_plus_multiplies_dsrgemm_nn_n_16x64x8_8x32x1_2x4_4x8_2 using WarpShape = cutlass::gemm::GemmShape<8, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -779,9 +779,9 @@ static void BM_SM50_device_plus_multiplies_dsrgemm_nn_n_32x32x8_16x16x1_4x2_4x8_ using WarpShape = cutlass::gemm::GemmShape<16, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -829,9 +829,9 @@ static void 
BM_SM50_device_plus_multiplies_dsrgemm_nn_n_32x64x8_16x32x1_4x4_4x8_ using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -879,9 +879,9 @@ static void BM_SM50_device_plus_multiplies_dsrgemm_nn_n_32x128x8_16x64x1_4x8_4x8 using WarpShape = cutlass::gemm::GemmShape<16, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -929,9 +929,9 @@ static void BM_SM50_device_plus_multiplies_dsrgemm_nn_n_64x32x8_32x16x1_4x4_8x4_ using WarpShape = cutlass::gemm::GemmShape<32, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -979,9 +979,9 @@ static void 
BM_SM50_device_plus_multiplies_dsrgemm_nn_n_64x64x8_32x32x1_8x4_4x8_ using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1029,9 +1029,9 @@ static void BM_SM50_device_plus_multiplies_dsrgemm_nn_n_128x32x8_64x16x1_8x4_8x4 using WarpShape = cutlass::gemm::GemmShape<64, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1079,9 +1079,9 @@ static void BM_SM50_device_plus_multiplies_dsrgemm_nn_n_16x64x16_8x16x1_2x2_4x8_ using WarpShape = cutlass::gemm::GemmShape<8, 16, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1129,9 +1129,9 @@ static void 
BM_SM50_device_plus_multiplies_dsrgemm_nn_n_16x128x16_8x32x1_2x4_4x8 using WarpShape = cutlass::gemm::GemmShape<8, 32, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1179,9 +1179,9 @@ static void BM_SM50_device_plus_multiplies_dsrgemm_nn_n_32x32x8_16x8x1_2x2_8x4_2 using WarpShape = cutlass::gemm::GemmShape<16, 8, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1229,9 +1229,9 @@ static void BM_SM50_device_plus_multiplies_dsrgemm_nn_n_32x64x8_16x16x1_4x2_4x8_ using WarpShape = cutlass::gemm::GemmShape<16, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1279,9 +1279,9 @@ static void 
BM_SM50_device_plus_multiplies_dsrgemm_nn_n_32x128x8_16x32x1_4x4_4x8 using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1329,9 +1329,9 @@ static void BM_SM50_device_plus_multiplies_dsrgemm_nn_n_64x64x8_32x16x1_4x4_8x4_ using WarpShape = cutlass::gemm::GemmShape<32, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1379,9 +1379,9 @@ static void BM_SM50_device_plus_multiplies_dsrgemm_nn_n_32x32x8_8x16x1_2x2_4x8_4 using WarpShape = cutlass::gemm::GemmShape<8, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1429,9 +1429,9 @@ static void 
BM_SM50_device_plus_multiplies_dsrgemm_nn_n_64x32x8_16x16x1_4x2_4x8_ using WarpShape = cutlass::gemm::GemmShape<16, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1479,9 +1479,9 @@ static void BM_SM50_device_plus_multiplies_dsrgemm_nn_n_64x64x8_16x32x1_4x4_4x8_ using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1529,9 +1529,9 @@ static void BM_SM50_device_plus_multiplies_dsrgemm_nn_n_128x32x8_32x16x1_4x4_8x4 using WarpShape = cutlass::gemm::GemmShape<32, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1579,9 +1579,9 @@ static void 
BM_SM50_device_plus_multiplies_dsrgemm_nn_n_32x64x16_8x16x1_2x2_4x8_ using WarpShape = cutlass::gemm::GemmShape<8, 16, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1629,9 +1629,9 @@ static void BM_SM50_device_plus_multiplies_dsrgemm_nn_n_32x128x16_8x32x1_2x4_4x8 using WarpShape = cutlass::gemm::GemmShape<8, 32, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1679,9 +1679,9 @@ static void BM_SM50_device_plus_multiplies_dsrgemm_nn_n_64x32x16_16x8x1_2x2_8x4_ using WarpShape = cutlass::gemm::GemmShape<16, 8, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1729,9 +1729,9 @@ static void 
BM_SM50_device_plus_multiplies_dsrgemm_nn_n_64x64x8_16x16x1_4x2_4x8_ using WarpShape = cutlass::gemm::GemmShape<16, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1779,9 +1779,9 @@ static void BM_SM50_device_plus_multiplies_dsrgemm_nn_n_128x32x16_32x8x1_4x2_8x4 using WarpShape = cutlass::gemm::GemmShape<32, 8, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; diff --git a/bench/device/sm50_simt_plus_multiplies_dsrgemm_nn_t.cu b/bench/device/sm50_simt_plus_multiplies_dsrgemm_nn_t.cu index ca2fe72..a5d2cff 100644 --- a/bench/device/sm50_simt_plus_multiplies_dsrgemm_nn_t.cu +++ b/bench/device/sm50_simt_plus_multiplies_dsrgemm_nn_t.cu @@ -29,9 +29,9 @@ static void BM_SM50_device_plus_multiplies_dsrgemm_nn_t_8x32x8_8x32x1_2x4_4x8_1x using WarpShape = cutlass::gemm::GemmShape<8, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename 
cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -79,9 +79,9 @@ static void BM_SM50_device_plus_multiplies_dsrgemm_nn_t_16x32x8_16x32x1_4x4_4x8_ using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -129,9 +129,9 @@ static void BM_SM50_device_plus_multiplies_dsrgemm_nn_t_16x64x8_16x64x1_4x8_4x8_ using WarpShape = cutlass::gemm::GemmShape<16, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -179,9 +179,9 @@ static void BM_SM50_device_plus_multiplies_dsrgemm_nn_t_32x32x8_32x32x1_8x4_4x8_ using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + 
precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -229,9 +229,9 @@ static void BM_SM50_device_plus_multiplies_dsrgemm_nn_t_8x32x8_8x16x1_2x2_4x8_1x using WarpShape = cutlass::gemm::GemmShape<8, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -279,9 +279,9 @@ static void BM_SM50_device_plus_multiplies_dsrgemm_nn_t_8x64x8_8x32x1_2x4_4x8_1x using WarpShape = cutlass::gemm::GemmShape<8, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -329,9 +329,9 @@ static void BM_SM50_device_plus_multiplies_dsrgemm_nn_t_16x32x8_16x16x1_4x2_4x8_ using WarpShape = cutlass::gemm::GemmShape<16, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, 
cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -379,9 +379,9 @@ static void BM_SM50_device_plus_multiplies_dsrgemm_nn_t_16x64x8_16x32x1_4x4_4x8_ using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -429,9 +429,9 @@ static void BM_SM50_device_plus_multiplies_dsrgemm_nn_t_16x128x8_16x64x1_4x8_4x8 using WarpShape = cutlass::gemm::GemmShape<16, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -479,9 +479,9 @@ static void BM_SM50_device_plus_multiplies_dsrgemm_nn_t_32x32x8_32x16x1_4x4_8x4_ using WarpShape = cutlass::gemm::GemmShape<32, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = 
Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -529,9 +529,9 @@ static void BM_SM50_device_plus_multiplies_dsrgemm_nn_t_32x64x8_32x32x1_8x4_4x8_ using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -579,9 +579,9 @@ static void BM_SM50_device_plus_multiplies_dsrgemm_nn_t_32x32x8_16x32x1_4x4_4x8_ using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -629,9 +629,9 @@ static void BM_SM50_device_plus_multiplies_dsrgemm_nn_t_64x32x8_32x32x1_8x4_4x8_ using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = 
Config::MultiplicationOp; @@ -679,9 +679,9 @@ static void BM_SM50_device_plus_multiplies_dsrgemm_nn_t_16x32x8_8x16x1_2x2_4x8_2 using WarpShape = cutlass::gemm::GemmShape<8, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -729,9 +729,9 @@ static void BM_SM50_device_plus_multiplies_dsrgemm_nn_t_16x64x8_8x32x1_2x4_4x8_2 using WarpShape = cutlass::gemm::GemmShape<8, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -779,9 +779,9 @@ static void BM_SM50_device_plus_multiplies_dsrgemm_nn_t_32x32x8_16x16x1_4x2_4x8_ using WarpShape = cutlass::gemm::GemmShape<16, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -829,9 +829,9 @@ static void 
BM_SM50_device_plus_multiplies_dsrgemm_nn_t_32x64x8_16x32x1_4x4_4x8_ using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -879,9 +879,9 @@ static void BM_SM50_device_plus_multiplies_dsrgemm_nn_t_32x128x8_16x64x1_4x8_4x8 using WarpShape = cutlass::gemm::GemmShape<16, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -929,9 +929,9 @@ static void BM_SM50_device_plus_multiplies_dsrgemm_nn_t_64x32x8_32x16x1_4x4_8x4_ using WarpShape = cutlass::gemm::GemmShape<32, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -979,9 +979,9 @@ static void 
BM_SM50_device_plus_multiplies_dsrgemm_nn_t_64x64x8_32x32x1_8x4_4x8_ using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1029,9 +1029,9 @@ static void BM_SM50_device_plus_multiplies_dsrgemm_nn_t_128x32x8_64x16x1_8x4_8x4 using WarpShape = cutlass::gemm::GemmShape<64, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1079,9 +1079,9 @@ static void BM_SM50_device_plus_multiplies_dsrgemm_nn_t_16x64x16_8x16x1_2x2_4x8_ using WarpShape = cutlass::gemm::GemmShape<8, 16, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1129,9 +1129,9 @@ static void 
BM_SM50_device_plus_multiplies_dsrgemm_nn_t_16x128x16_8x32x1_2x4_4x8 using WarpShape = cutlass::gemm::GemmShape<8, 32, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1179,9 +1179,9 @@ static void BM_SM50_device_plus_multiplies_dsrgemm_nn_t_32x32x8_16x8x1_2x2_8x4_2 using WarpShape = cutlass::gemm::GemmShape<16, 8, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1229,9 +1229,9 @@ static void BM_SM50_device_plus_multiplies_dsrgemm_nn_t_32x64x8_16x16x1_4x2_4x8_ using WarpShape = cutlass::gemm::GemmShape<16, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1279,9 +1279,9 @@ static void 
BM_SM50_device_plus_multiplies_dsrgemm_nn_t_32x128x8_16x32x1_4x4_4x8 using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1329,9 +1329,9 @@ static void BM_SM50_device_plus_multiplies_dsrgemm_nn_t_64x64x8_32x16x1_4x4_8x4_ using WarpShape = cutlass::gemm::GemmShape<32, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1379,9 +1379,9 @@ static void BM_SM50_device_plus_multiplies_dsrgemm_nn_t_32x32x8_8x16x1_2x2_4x8_4 using WarpShape = cutlass::gemm::GemmShape<8, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1429,9 +1429,9 @@ static void 
BM_SM50_device_plus_multiplies_dsrgemm_nn_t_64x32x8_16x16x1_4x2_4x8_ using WarpShape = cutlass::gemm::GemmShape<16, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1479,9 +1479,9 @@ static void BM_SM50_device_plus_multiplies_dsrgemm_nn_t_64x64x8_16x32x1_4x4_4x8_ using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1529,9 +1529,9 @@ static void BM_SM50_device_plus_multiplies_dsrgemm_nn_t_128x32x8_32x16x1_4x4_8x4 using WarpShape = cutlass::gemm::GemmShape<32, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1579,9 +1579,9 @@ static void 
BM_SM50_device_plus_multiplies_dsrgemm_nn_t_32x64x16_8x16x1_2x2_4x8_ using WarpShape = cutlass::gemm::GemmShape<8, 16, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1629,9 +1629,9 @@ static void BM_SM50_device_plus_multiplies_dsrgemm_nn_t_32x128x16_8x32x1_2x4_4x8 using WarpShape = cutlass::gemm::GemmShape<8, 32, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1679,9 +1679,9 @@ static void BM_SM50_device_plus_multiplies_dsrgemm_nn_t_64x32x16_16x8x1_2x2_8x4_ using WarpShape = cutlass::gemm::GemmShape<16, 8, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1729,9 +1729,9 @@ static void 
BM_SM50_device_plus_multiplies_dsrgemm_nn_t_64x64x8_16x16x1_4x2_4x8_ using WarpShape = cutlass::gemm::GemmShape<16, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1779,9 +1779,9 @@ static void BM_SM50_device_plus_multiplies_dsrgemm_nn_t_128x32x16_32x8x1_4x2_8x4 using WarpShape = cutlass::gemm::GemmShape<32, 8, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; diff --git a/bench/device/sm50_simt_plus_multiplies_dsrgemm_nt_n.cu b/bench/device/sm50_simt_plus_multiplies_dsrgemm_nt_n.cu index f9f4901..0f9fac1 100644 --- a/bench/device/sm50_simt_plus_multiplies_dsrgemm_nt_n.cu +++ b/bench/device/sm50_simt_plus_multiplies_dsrgemm_nt_n.cu @@ -29,9 +29,9 @@ static void BM_SM50_device_plus_multiplies_dsrgemm_nt_n_8x32x8_8x32x1_2x4_4x8_1x using WarpShape = cutlass::gemm::GemmShape<8, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename 
cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -79,9 +79,9 @@ static void BM_SM50_device_plus_multiplies_dsrgemm_nt_n_16x32x8_16x32x1_4x4_4x8_ using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -129,9 +129,9 @@ static void BM_SM50_device_plus_multiplies_dsrgemm_nt_n_16x64x8_16x64x1_4x8_4x8_ using WarpShape = cutlass::gemm::GemmShape<16, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -179,9 +179,9 @@ static void BM_SM50_device_plus_multiplies_dsrgemm_nt_n_32x32x8_32x32x1_8x4_4x8_ using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + 
precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -229,9 +229,9 @@ static void BM_SM50_device_plus_multiplies_dsrgemm_nt_n_8x32x8_8x16x1_2x2_4x8_1x using WarpShape = cutlass::gemm::GemmShape<8, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -279,9 +279,9 @@ static void BM_SM50_device_plus_multiplies_dsrgemm_nt_n_8x64x8_8x32x1_2x4_4x8_1x using WarpShape = cutlass::gemm::GemmShape<8, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -329,9 +329,9 @@ static void BM_SM50_device_plus_multiplies_dsrgemm_nt_n_16x32x8_16x16x1_4x2_4x8_ using WarpShape = cutlass::gemm::GemmShape<16, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, 
cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -379,9 +379,9 @@ static void BM_SM50_device_plus_multiplies_dsrgemm_nt_n_16x64x8_16x32x1_4x4_4x8_ using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -429,9 +429,9 @@ static void BM_SM50_device_plus_multiplies_dsrgemm_nt_n_16x128x8_16x64x1_4x8_4x8 using WarpShape = cutlass::gemm::GemmShape<16, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -479,9 +479,9 @@ static void BM_SM50_device_plus_multiplies_dsrgemm_nt_n_32x32x8_32x16x1_4x4_8x4_ using WarpShape = cutlass::gemm::GemmShape<32, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = 
Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -529,9 +529,9 @@ static void BM_SM50_device_plus_multiplies_dsrgemm_nt_n_32x64x8_32x32x1_8x4_4x8_ using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -579,9 +579,9 @@ static void BM_SM50_device_plus_multiplies_dsrgemm_nt_n_32x32x8_16x32x1_4x4_4x8_ using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -629,9 +629,9 @@ static void BM_SM50_device_plus_multiplies_dsrgemm_nt_n_64x32x8_32x32x1_8x4_4x8_ using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = 
Config::MultiplicationOp; @@ -679,9 +679,9 @@ static void BM_SM50_device_plus_multiplies_dsrgemm_nt_n_16x32x8_8x16x1_2x2_4x8_2 using WarpShape = cutlass::gemm::GemmShape<8, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -729,9 +729,9 @@ static void BM_SM50_device_plus_multiplies_dsrgemm_nt_n_16x64x8_8x32x1_2x4_4x8_2 using WarpShape = cutlass::gemm::GemmShape<8, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -779,9 +779,9 @@ static void BM_SM50_device_plus_multiplies_dsrgemm_nt_n_32x32x8_16x16x1_4x2_4x8_ using WarpShape = cutlass::gemm::GemmShape<16, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -829,9 +829,9 @@ static void 
BM_SM50_device_plus_multiplies_dsrgemm_nt_n_32x64x8_16x32x1_4x4_4x8_ using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -879,9 +879,9 @@ static void BM_SM50_device_plus_multiplies_dsrgemm_nt_n_32x128x8_16x64x1_4x8_4x8 using WarpShape = cutlass::gemm::GemmShape<16, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -929,9 +929,9 @@ static void BM_SM50_device_plus_multiplies_dsrgemm_nt_n_64x32x8_32x16x1_4x4_8x4_ using WarpShape = cutlass::gemm::GemmShape<32, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -979,9 +979,9 @@ static void 
BM_SM50_device_plus_multiplies_dsrgemm_nt_n_64x64x8_32x32x1_8x4_4x8_ using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1029,9 +1029,9 @@ static void BM_SM50_device_plus_multiplies_dsrgemm_nt_n_128x32x8_64x16x1_8x4_8x4 using WarpShape = cutlass::gemm::GemmShape<64, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1079,9 +1079,9 @@ static void BM_SM50_device_plus_multiplies_dsrgemm_nt_n_16x64x16_8x16x1_2x2_4x8_ using WarpShape = cutlass::gemm::GemmShape<8, 16, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1129,9 +1129,9 @@ static void 
BM_SM50_device_plus_multiplies_dsrgemm_nt_n_16x128x16_8x32x1_2x4_4x8 using WarpShape = cutlass::gemm::GemmShape<8, 32, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1179,9 +1179,9 @@ static void BM_SM50_device_plus_multiplies_dsrgemm_nt_n_32x32x8_16x8x1_2x2_8x4_2 using WarpShape = cutlass::gemm::GemmShape<16, 8, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1229,9 +1229,9 @@ static void BM_SM50_device_plus_multiplies_dsrgemm_nt_n_32x64x8_16x16x1_4x2_4x8_ using WarpShape = cutlass::gemm::GemmShape<16, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1279,9 +1279,9 @@ static void 
BM_SM50_device_plus_multiplies_dsrgemm_nt_n_32x128x8_16x32x1_4x4_4x8 using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1329,9 +1329,9 @@ static void BM_SM50_device_plus_multiplies_dsrgemm_nt_n_64x64x8_32x16x1_4x4_8x4_ using WarpShape = cutlass::gemm::GemmShape<32, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1379,9 +1379,9 @@ static void BM_SM50_device_plus_multiplies_dsrgemm_nt_n_32x32x8_8x16x1_2x2_4x8_4 using WarpShape = cutlass::gemm::GemmShape<8, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1429,9 +1429,9 @@ static void 
BM_SM50_device_plus_multiplies_dsrgemm_nt_n_64x32x8_16x16x1_4x2_4x8_ using WarpShape = cutlass::gemm::GemmShape<16, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1479,9 +1479,9 @@ static void BM_SM50_device_plus_multiplies_dsrgemm_nt_n_64x64x8_16x32x1_4x4_4x8_ using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1529,9 +1529,9 @@ static void BM_SM50_device_plus_multiplies_dsrgemm_nt_n_128x32x8_32x16x1_4x4_8x4 using WarpShape = cutlass::gemm::GemmShape<32, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1579,9 +1579,9 @@ static void 
BM_SM50_device_plus_multiplies_dsrgemm_nt_n_32x64x16_8x16x1_2x2_4x8_ using WarpShape = cutlass::gemm::GemmShape<8, 16, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1629,9 +1629,9 @@ static void BM_SM50_device_plus_multiplies_dsrgemm_nt_n_32x128x16_8x32x1_2x4_4x8 using WarpShape = cutlass::gemm::GemmShape<8, 32, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1679,9 +1679,9 @@ static void BM_SM50_device_plus_multiplies_dsrgemm_nt_n_64x32x16_16x8x1_2x2_8x4_ using WarpShape = cutlass::gemm::GemmShape<16, 8, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1729,9 +1729,9 @@ static void 
BM_SM50_device_plus_multiplies_dsrgemm_nt_n_64x64x8_16x16x1_4x2_4x8_ using WarpShape = cutlass::gemm::GemmShape<16, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1779,9 +1779,9 @@ static void BM_SM50_device_plus_multiplies_dsrgemm_nt_n_128x32x16_32x8x1_4x2_8x4 using WarpShape = cutlass::gemm::GemmShape<32, 8, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; diff --git a/bench/device/sm50_simt_plus_multiplies_dsrgemm_nt_t.cu b/bench/device/sm50_simt_plus_multiplies_dsrgemm_nt_t.cu index 19a0ba9..a2b1095 100644 --- a/bench/device/sm50_simt_plus_multiplies_dsrgemm_nt_t.cu +++ b/bench/device/sm50_simt_plus_multiplies_dsrgemm_nt_t.cu @@ -29,9 +29,9 @@ static void BM_SM50_device_plus_multiplies_dsrgemm_nt_t_8x32x8_8x32x1_2x4_4x8_1x using WarpShape = cutlass::gemm::GemmShape<8, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename 
cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -79,9 +79,9 @@ static void BM_SM50_device_plus_multiplies_dsrgemm_nt_t_16x32x8_16x32x1_4x4_4x8_ using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -129,9 +129,9 @@ static void BM_SM50_device_plus_multiplies_dsrgemm_nt_t_16x64x8_16x64x1_4x8_4x8_ using WarpShape = cutlass::gemm::GemmShape<16, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -179,9 +179,9 @@ static void BM_SM50_device_plus_multiplies_dsrgemm_nt_t_32x32x8_32x32x1_8x4_4x8_ using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + 
precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -229,9 +229,9 @@ static void BM_SM50_device_plus_multiplies_dsrgemm_nt_t_8x32x8_8x16x1_2x2_4x8_1x using WarpShape = cutlass::gemm::GemmShape<8, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -279,9 +279,9 @@ static void BM_SM50_device_plus_multiplies_dsrgemm_nt_t_8x64x8_8x32x1_2x4_4x8_1x using WarpShape = cutlass::gemm::GemmShape<8, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -329,9 +329,9 @@ static void BM_SM50_device_plus_multiplies_dsrgemm_nt_t_16x32x8_16x16x1_4x2_4x8_ using WarpShape = cutlass::gemm::GemmShape<16, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, 
cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -379,9 +379,9 @@ static void BM_SM50_device_plus_multiplies_dsrgemm_nt_t_16x64x8_16x32x1_4x4_4x8_ using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -429,9 +429,9 @@ static void BM_SM50_device_plus_multiplies_dsrgemm_nt_t_16x128x8_16x64x1_4x8_4x8 using WarpShape = cutlass::gemm::GemmShape<16, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -479,9 +479,9 @@ static void BM_SM50_device_plus_multiplies_dsrgemm_nt_t_32x32x8_32x16x1_4x4_8x4_ using WarpShape = cutlass::gemm::GemmShape<32, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = 
Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -529,9 +529,9 @@ static void BM_SM50_device_plus_multiplies_dsrgemm_nt_t_32x64x8_32x32x1_8x4_4x8_ using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -579,9 +579,9 @@ static void BM_SM50_device_plus_multiplies_dsrgemm_nt_t_32x32x8_16x32x1_4x4_4x8_ using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -629,9 +629,9 @@ static void BM_SM50_device_plus_multiplies_dsrgemm_nt_t_64x32x8_32x32x1_8x4_4x8_ using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = 
Config::MultiplicationOp; @@ -679,9 +679,9 @@ static void BM_SM50_device_plus_multiplies_dsrgemm_nt_t_16x32x8_8x16x1_2x2_4x8_2 using WarpShape = cutlass::gemm::GemmShape<8, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -729,9 +729,9 @@ static void BM_SM50_device_plus_multiplies_dsrgemm_nt_t_16x64x8_8x32x1_2x4_4x8_2 using WarpShape = cutlass::gemm::GemmShape<8, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -779,9 +779,9 @@ static void BM_SM50_device_plus_multiplies_dsrgemm_nt_t_32x32x8_16x16x1_4x2_4x8_ using WarpShape = cutlass::gemm::GemmShape<16, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -829,9 +829,9 @@ static void 
BM_SM50_device_plus_multiplies_dsrgemm_nt_t_32x64x8_16x32x1_4x4_4x8_ using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -879,9 +879,9 @@ static void BM_SM50_device_plus_multiplies_dsrgemm_nt_t_32x128x8_16x64x1_4x8_4x8 using WarpShape = cutlass::gemm::GemmShape<16, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -929,9 +929,9 @@ static void BM_SM50_device_plus_multiplies_dsrgemm_nt_t_64x32x8_32x16x1_4x4_8x4_ using WarpShape = cutlass::gemm::GemmShape<32, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -979,9 +979,9 @@ static void 
BM_SM50_device_plus_multiplies_dsrgemm_nt_t_64x64x8_32x32x1_8x4_4x8_ using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1029,9 +1029,9 @@ static void BM_SM50_device_plus_multiplies_dsrgemm_nt_t_128x32x8_64x16x1_8x4_8x4 using WarpShape = cutlass::gemm::GemmShape<64, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1079,9 +1079,9 @@ static void BM_SM50_device_plus_multiplies_dsrgemm_nt_t_16x64x16_8x16x1_2x2_4x8_ using WarpShape = cutlass::gemm::GemmShape<8, 16, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1129,9 +1129,9 @@ static void 
BM_SM50_device_plus_multiplies_dsrgemm_nt_t_16x128x16_8x32x1_2x4_4x8 using WarpShape = cutlass::gemm::GemmShape<8, 32, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1179,9 +1179,9 @@ static void BM_SM50_device_plus_multiplies_dsrgemm_nt_t_32x32x8_16x8x1_2x2_8x4_2 using WarpShape = cutlass::gemm::GemmShape<16, 8, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1229,9 +1229,9 @@ static void BM_SM50_device_plus_multiplies_dsrgemm_nt_t_32x64x8_16x16x1_4x2_4x8_ using WarpShape = cutlass::gemm::GemmShape<16, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1279,9 +1279,9 @@ static void 
BM_SM50_device_plus_multiplies_dsrgemm_nt_t_32x128x8_16x32x1_4x4_4x8 using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1329,9 +1329,9 @@ static void BM_SM50_device_plus_multiplies_dsrgemm_nt_t_64x64x8_32x16x1_4x4_8x4_ using WarpShape = cutlass::gemm::GemmShape<32, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1379,9 +1379,9 @@ static void BM_SM50_device_plus_multiplies_dsrgemm_nt_t_32x32x8_8x16x1_2x2_4x8_4 using WarpShape = cutlass::gemm::GemmShape<8, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1429,9 +1429,9 @@ static void 
BM_SM50_device_plus_multiplies_dsrgemm_nt_t_64x32x8_16x16x1_4x2_4x8_ using WarpShape = cutlass::gemm::GemmShape<16, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1479,9 +1479,9 @@ static void BM_SM50_device_plus_multiplies_dsrgemm_nt_t_64x64x8_16x32x1_4x4_4x8_ using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1529,9 +1529,9 @@ static void BM_SM50_device_plus_multiplies_dsrgemm_nt_t_128x32x8_32x16x1_4x4_8x4 using WarpShape = cutlass::gemm::GemmShape<32, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1579,9 +1579,9 @@ static void 
BM_SM50_device_plus_multiplies_dsrgemm_nt_t_32x64x16_8x16x1_2x2_4x8_ using WarpShape = cutlass::gemm::GemmShape<8, 16, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1629,9 +1629,9 @@ static void BM_SM50_device_plus_multiplies_dsrgemm_nt_t_32x128x16_8x32x1_2x4_4x8 using WarpShape = cutlass::gemm::GemmShape<8, 32, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1679,9 +1679,9 @@ static void BM_SM50_device_plus_multiplies_dsrgemm_nt_t_64x32x16_16x8x1_2x2_8x4_ using WarpShape = cutlass::gemm::GemmShape<16, 8, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1729,9 +1729,9 @@ static void 
BM_SM50_device_plus_multiplies_dsrgemm_nt_t_64x64x8_16x16x1_4x2_4x8_ using WarpShape = cutlass::gemm::GemmShape<16, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1779,9 +1779,9 @@ static void BM_SM50_device_plus_multiplies_dsrgemm_nt_t_128x32x16_32x8x1_4x2_8x4 using WarpShape = cutlass::gemm::GemmShape<32, 8, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; diff --git a/bench/device/sm50_simt_plus_multiplies_dsrgemm_tn_n.cu b/bench/device/sm50_simt_plus_multiplies_dsrgemm_tn_n.cu index bb34240..5761ed4 100644 --- a/bench/device/sm50_simt_plus_multiplies_dsrgemm_tn_n.cu +++ b/bench/device/sm50_simt_plus_multiplies_dsrgemm_tn_n.cu @@ -29,9 +29,9 @@ static void BM_SM50_device_plus_multiplies_dsrgemm_tn_n_8x32x8_8x32x1_2x4_4x8_1x using WarpShape = cutlass::gemm::GemmShape<8, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename 
cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -79,9 +79,9 @@ static void BM_SM50_device_plus_multiplies_dsrgemm_tn_n_16x32x8_16x32x1_4x4_4x8_ using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -129,9 +129,9 @@ static void BM_SM50_device_plus_multiplies_dsrgemm_tn_n_16x64x8_16x64x1_4x8_4x8_ using WarpShape = cutlass::gemm::GemmShape<16, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -179,9 +179,9 @@ static void BM_SM50_device_plus_multiplies_dsrgemm_tn_n_32x32x8_32x32x1_8x4_4x8_ using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + 
precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -229,9 +229,9 @@ static void BM_SM50_device_plus_multiplies_dsrgemm_tn_n_8x32x8_8x16x1_2x2_4x8_1x using WarpShape = cutlass::gemm::GemmShape<8, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -279,9 +279,9 @@ static void BM_SM50_device_plus_multiplies_dsrgemm_tn_n_8x64x8_8x32x1_2x4_4x8_1x using WarpShape = cutlass::gemm::GemmShape<8, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -329,9 +329,9 @@ static void BM_SM50_device_plus_multiplies_dsrgemm_tn_n_16x32x8_16x16x1_4x2_4x8_ using WarpShape = cutlass::gemm::GemmShape<16, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, 
cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -379,9 +379,9 @@ static void BM_SM50_device_plus_multiplies_dsrgemm_tn_n_16x64x8_16x32x1_4x4_4x8_ using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -429,9 +429,9 @@ static void BM_SM50_device_plus_multiplies_dsrgemm_tn_n_16x128x8_16x64x1_4x8_4x8 using WarpShape = cutlass::gemm::GemmShape<16, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -479,9 +479,9 @@ static void BM_SM50_device_plus_multiplies_dsrgemm_tn_n_32x32x8_32x16x1_4x4_8x4_ using WarpShape = cutlass::gemm::GemmShape<32, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = 
Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -529,9 +529,9 @@ static void BM_SM50_device_plus_multiplies_dsrgemm_tn_n_32x64x8_32x32x1_8x4_4x8_ using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -579,9 +579,9 @@ static void BM_SM50_device_plus_multiplies_dsrgemm_tn_n_32x32x8_16x32x1_4x4_4x8_ using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -629,9 +629,9 @@ static void BM_SM50_device_plus_multiplies_dsrgemm_tn_n_64x32x8_32x32x1_8x4_4x8_ using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = 
Config::MultiplicationOp; @@ -679,9 +679,9 @@ static void BM_SM50_device_plus_multiplies_dsrgemm_tn_n_16x32x8_8x16x1_2x2_4x8_2 using WarpShape = cutlass::gemm::GemmShape<8, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -729,9 +729,9 @@ static void BM_SM50_device_plus_multiplies_dsrgemm_tn_n_16x64x8_8x32x1_2x4_4x8_2 using WarpShape = cutlass::gemm::GemmShape<8, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -779,9 +779,9 @@ static void BM_SM50_device_plus_multiplies_dsrgemm_tn_n_32x32x8_16x16x1_4x2_4x8_ using WarpShape = cutlass::gemm::GemmShape<16, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -829,9 +829,9 @@ static void 
BM_SM50_device_plus_multiplies_dsrgemm_tn_n_32x64x8_16x32x1_4x4_4x8_ using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -879,9 +879,9 @@ static void BM_SM50_device_plus_multiplies_dsrgemm_tn_n_32x128x8_16x64x1_4x8_4x8 using WarpShape = cutlass::gemm::GemmShape<16, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -929,9 +929,9 @@ static void BM_SM50_device_plus_multiplies_dsrgemm_tn_n_64x32x8_32x16x1_4x4_8x4_ using WarpShape = cutlass::gemm::GemmShape<32, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -979,9 +979,9 @@ static void 
BM_SM50_device_plus_multiplies_dsrgemm_tn_n_64x64x8_32x32x1_8x4_4x8_ using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1029,9 +1029,9 @@ static void BM_SM50_device_plus_multiplies_dsrgemm_tn_n_128x32x8_64x16x1_8x4_8x4 using WarpShape = cutlass::gemm::GemmShape<64, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1079,9 +1079,9 @@ static void BM_SM50_device_plus_multiplies_dsrgemm_tn_n_16x64x16_8x16x1_2x2_4x8_ using WarpShape = cutlass::gemm::GemmShape<8, 16, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1129,9 +1129,9 @@ static void 
BM_SM50_device_plus_multiplies_dsrgemm_tn_n_16x128x16_8x32x1_2x4_4x8 using WarpShape = cutlass::gemm::GemmShape<8, 32, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1179,9 +1179,9 @@ static void BM_SM50_device_plus_multiplies_dsrgemm_tn_n_32x32x8_16x8x1_2x2_8x4_2 using WarpShape = cutlass::gemm::GemmShape<16, 8, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1229,9 +1229,9 @@ static void BM_SM50_device_plus_multiplies_dsrgemm_tn_n_32x64x8_16x16x1_4x2_4x8_ using WarpShape = cutlass::gemm::GemmShape<16, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1279,9 +1279,9 @@ static void 
BM_SM50_device_plus_multiplies_dsrgemm_tn_n_32x128x8_16x32x1_4x4_4x8 using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1329,9 +1329,9 @@ static void BM_SM50_device_plus_multiplies_dsrgemm_tn_n_64x64x8_32x16x1_4x4_8x4_ using WarpShape = cutlass::gemm::GemmShape<32, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1379,9 +1379,9 @@ static void BM_SM50_device_plus_multiplies_dsrgemm_tn_n_32x32x8_8x16x1_2x2_4x8_4 using WarpShape = cutlass::gemm::GemmShape<8, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1429,9 +1429,9 @@ static void 
BM_SM50_device_plus_multiplies_dsrgemm_tn_n_64x32x8_16x16x1_4x2_4x8_ using WarpShape = cutlass::gemm::GemmShape<16, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1479,9 +1479,9 @@ static void BM_SM50_device_plus_multiplies_dsrgemm_tn_n_64x64x8_16x32x1_4x4_4x8_ using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1529,9 +1529,9 @@ static void BM_SM50_device_plus_multiplies_dsrgemm_tn_n_128x32x8_32x16x1_4x4_8x4 using WarpShape = cutlass::gemm::GemmShape<32, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1579,9 +1579,9 @@ static void 
BM_SM50_device_plus_multiplies_dsrgemm_tn_n_32x64x16_8x16x1_2x2_4x8_ using WarpShape = cutlass::gemm::GemmShape<8, 16, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1629,9 +1629,9 @@ static void BM_SM50_device_plus_multiplies_dsrgemm_tn_n_32x128x16_8x32x1_2x4_4x8 using WarpShape = cutlass::gemm::GemmShape<8, 32, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1679,9 +1679,9 @@ static void BM_SM50_device_plus_multiplies_dsrgemm_tn_n_64x32x16_16x8x1_2x2_8x4_ using WarpShape = cutlass::gemm::GemmShape<16, 8, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1729,9 +1729,9 @@ static void 
BM_SM50_device_plus_multiplies_dsrgemm_tn_n_64x64x8_16x16x1_4x2_4x8_ using WarpShape = cutlass::gemm::GemmShape<16, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1779,9 +1779,9 @@ static void BM_SM50_device_plus_multiplies_dsrgemm_tn_n_128x32x16_32x8x1_4x2_8x4 using WarpShape = cutlass::gemm::GemmShape<32, 8, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; diff --git a/bench/device/sm50_simt_plus_multiplies_dsrgemm_tn_t.cu b/bench/device/sm50_simt_plus_multiplies_dsrgemm_tn_t.cu index cd96536..f7f5940 100644 --- a/bench/device/sm50_simt_plus_multiplies_dsrgemm_tn_t.cu +++ b/bench/device/sm50_simt_plus_multiplies_dsrgemm_tn_t.cu @@ -29,9 +29,9 @@ static void BM_SM50_device_plus_multiplies_dsrgemm_tn_t_8x32x8_8x32x1_2x4_4x8_1x using WarpShape = cutlass::gemm::GemmShape<8, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename 
cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -79,9 +79,9 @@ static void BM_SM50_device_plus_multiplies_dsrgemm_tn_t_16x32x8_16x32x1_4x4_4x8_ using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -129,9 +129,9 @@ static void BM_SM50_device_plus_multiplies_dsrgemm_tn_t_16x64x8_16x64x1_4x8_4x8_ using WarpShape = cutlass::gemm::GemmShape<16, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -179,9 +179,9 @@ static void BM_SM50_device_plus_multiplies_dsrgemm_tn_t_32x32x8_32x32x1_8x4_4x8_ using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + 
precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -229,9 +229,9 @@ static void BM_SM50_device_plus_multiplies_dsrgemm_tn_t_8x32x8_8x16x1_2x2_4x8_1x using WarpShape = cutlass::gemm::GemmShape<8, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -279,9 +279,9 @@ static void BM_SM50_device_plus_multiplies_dsrgemm_tn_t_8x64x8_8x32x1_2x4_4x8_1x using WarpShape = cutlass::gemm::GemmShape<8, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -329,9 +329,9 @@ static void BM_SM50_device_plus_multiplies_dsrgemm_tn_t_16x32x8_16x16x1_4x2_4x8_ using WarpShape = cutlass::gemm::GemmShape<16, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, 
cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -379,9 +379,9 @@ static void BM_SM50_device_plus_multiplies_dsrgemm_tn_t_16x64x8_16x32x1_4x4_4x8_ using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -429,9 +429,9 @@ static void BM_SM50_device_plus_multiplies_dsrgemm_tn_t_16x128x8_16x64x1_4x8_4x8 using WarpShape = cutlass::gemm::GemmShape<16, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -479,9 +479,9 @@ static void BM_SM50_device_plus_multiplies_dsrgemm_tn_t_32x32x8_32x16x1_4x4_8x4_ using WarpShape = cutlass::gemm::GemmShape<32, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = 
Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -529,9 +529,9 @@ static void BM_SM50_device_plus_multiplies_dsrgemm_tn_t_32x64x8_32x32x1_8x4_4x8_ using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -579,9 +579,9 @@ static void BM_SM50_device_plus_multiplies_dsrgemm_tn_t_32x32x8_16x32x1_4x4_4x8_ using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -629,9 +629,9 @@ static void BM_SM50_device_plus_multiplies_dsrgemm_tn_t_64x32x8_32x32x1_8x4_4x8_ using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = 
Config::MultiplicationOp; @@ -679,9 +679,9 @@ static void BM_SM50_device_plus_multiplies_dsrgemm_tn_t_16x32x8_8x16x1_2x2_4x8_2 using WarpShape = cutlass::gemm::GemmShape<8, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -729,9 +729,9 @@ static void BM_SM50_device_plus_multiplies_dsrgemm_tn_t_16x64x8_8x32x1_2x4_4x8_2 using WarpShape = cutlass::gemm::GemmShape<8, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -779,9 +779,9 @@ static void BM_SM50_device_plus_multiplies_dsrgemm_tn_t_32x32x8_16x16x1_4x2_4x8_ using WarpShape = cutlass::gemm::GemmShape<16, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -829,9 +829,9 @@ static void 
BM_SM50_device_plus_multiplies_dsrgemm_tn_t_32x64x8_16x32x1_4x4_4x8_ using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -879,9 +879,9 @@ static void BM_SM50_device_plus_multiplies_dsrgemm_tn_t_32x128x8_16x64x1_4x8_4x8 using WarpShape = cutlass::gemm::GemmShape<16, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -929,9 +929,9 @@ static void BM_SM50_device_plus_multiplies_dsrgemm_tn_t_64x32x8_32x16x1_4x4_8x4_ using WarpShape = cutlass::gemm::GemmShape<32, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -979,9 +979,9 @@ static void 
BM_SM50_device_plus_multiplies_dsrgemm_tn_t_64x64x8_32x32x1_8x4_4x8_ using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1029,9 +1029,9 @@ static void BM_SM50_device_plus_multiplies_dsrgemm_tn_t_128x32x8_64x16x1_8x4_8x4 using WarpShape = cutlass::gemm::GemmShape<64, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1079,9 +1079,9 @@ static void BM_SM50_device_plus_multiplies_dsrgemm_tn_t_16x64x16_8x16x1_2x2_4x8_ using WarpShape = cutlass::gemm::GemmShape<8, 16, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1129,9 +1129,9 @@ static void 
BM_SM50_device_plus_multiplies_dsrgemm_tn_t_16x128x16_8x32x1_2x4_4x8 using WarpShape = cutlass::gemm::GemmShape<8, 32, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1179,9 +1179,9 @@ static void BM_SM50_device_plus_multiplies_dsrgemm_tn_t_32x32x8_16x8x1_2x2_8x4_2 using WarpShape = cutlass::gemm::GemmShape<16, 8, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1229,9 +1229,9 @@ static void BM_SM50_device_plus_multiplies_dsrgemm_tn_t_32x64x8_16x16x1_4x2_4x8_ using WarpShape = cutlass::gemm::GemmShape<16, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1279,9 +1279,9 @@ static void 
BM_SM50_device_plus_multiplies_dsrgemm_tn_t_32x128x8_16x32x1_4x4_4x8 using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1329,9 +1329,9 @@ static void BM_SM50_device_plus_multiplies_dsrgemm_tn_t_64x64x8_32x16x1_4x4_8x4_ using WarpShape = cutlass::gemm::GemmShape<32, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1379,9 +1379,9 @@ static void BM_SM50_device_plus_multiplies_dsrgemm_tn_t_32x32x8_8x16x1_2x2_4x8_4 using WarpShape = cutlass::gemm::GemmShape<8, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1429,9 +1429,9 @@ static void 
BM_SM50_device_plus_multiplies_dsrgemm_tn_t_64x32x8_16x16x1_4x2_4x8_ using WarpShape = cutlass::gemm::GemmShape<16, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1479,9 +1479,9 @@ static void BM_SM50_device_plus_multiplies_dsrgemm_tn_t_64x64x8_16x32x1_4x4_4x8_ using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1529,9 +1529,9 @@ static void BM_SM50_device_plus_multiplies_dsrgemm_tn_t_128x32x8_32x16x1_4x4_8x4 using WarpShape = cutlass::gemm::GemmShape<32, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1579,9 +1579,9 @@ static void 
BM_SM50_device_plus_multiplies_dsrgemm_tn_t_32x64x16_8x16x1_2x2_4x8_ using WarpShape = cutlass::gemm::GemmShape<8, 16, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1629,9 +1629,9 @@ static void BM_SM50_device_plus_multiplies_dsrgemm_tn_t_32x128x16_8x32x1_2x4_4x8 using WarpShape = cutlass::gemm::GemmShape<8, 32, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1679,9 +1679,9 @@ static void BM_SM50_device_plus_multiplies_dsrgemm_tn_t_64x32x16_16x8x1_2x2_8x4_ using WarpShape = cutlass::gemm::GemmShape<16, 8, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1729,9 +1729,9 @@ static void 
BM_SM50_device_plus_multiplies_dsrgemm_tn_t_64x64x8_16x16x1_4x2_4x8_ using WarpShape = cutlass::gemm::GemmShape<16, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1779,9 +1779,9 @@ static void BM_SM50_device_plus_multiplies_dsrgemm_tn_t_128x32x16_32x8x1_4x2_8x4 using WarpShape = cutlass::gemm::GemmShape<32, 8, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; diff --git a/bench/device/sm50_simt_plus_multiplies_dsrgemm_tt_n.cu b/bench/device/sm50_simt_plus_multiplies_dsrgemm_tt_n.cu index b20eadb..fa0e7ad 100644 --- a/bench/device/sm50_simt_plus_multiplies_dsrgemm_tt_n.cu +++ b/bench/device/sm50_simt_plus_multiplies_dsrgemm_tt_n.cu @@ -29,9 +29,9 @@ static void BM_SM50_device_plus_multiplies_dsrgemm_tt_n_8x32x8_8x32x1_2x4_4x8_1x using WarpShape = cutlass::gemm::GemmShape<8, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename 
cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -79,9 +79,9 @@ static void BM_SM50_device_plus_multiplies_dsrgemm_tt_n_16x32x8_16x32x1_4x4_4x8_ using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -129,9 +129,9 @@ static void BM_SM50_device_plus_multiplies_dsrgemm_tt_n_16x64x8_16x64x1_4x8_4x8_ using WarpShape = cutlass::gemm::GemmShape<16, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -179,9 +179,9 @@ static void BM_SM50_device_plus_multiplies_dsrgemm_tt_n_32x32x8_32x32x1_8x4_4x8_ using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + 
precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -229,9 +229,9 @@ static void BM_SM50_device_plus_multiplies_dsrgemm_tt_n_8x32x8_8x16x1_2x2_4x8_1x using WarpShape = cutlass::gemm::GemmShape<8, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -279,9 +279,9 @@ static void BM_SM50_device_plus_multiplies_dsrgemm_tt_n_8x64x8_8x32x1_2x4_4x8_1x using WarpShape = cutlass::gemm::GemmShape<8, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -329,9 +329,9 @@ static void BM_SM50_device_plus_multiplies_dsrgemm_tt_n_16x32x8_16x16x1_4x2_4x8_ using WarpShape = cutlass::gemm::GemmShape<16, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, 
cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -379,9 +379,9 @@ static void BM_SM50_device_plus_multiplies_dsrgemm_tt_n_16x64x8_16x32x1_4x4_4x8_ using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -429,9 +429,9 @@ static void BM_SM50_device_plus_multiplies_dsrgemm_tt_n_16x128x8_16x64x1_4x8_4x8 using WarpShape = cutlass::gemm::GemmShape<16, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -479,9 +479,9 @@ static void BM_SM50_device_plus_multiplies_dsrgemm_tt_n_32x32x8_32x16x1_4x4_8x4_ using WarpShape = cutlass::gemm::GemmShape<32, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = 
Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -529,9 +529,9 @@ static void BM_SM50_device_plus_multiplies_dsrgemm_tt_n_32x64x8_32x32x1_8x4_4x8_ using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -579,9 +579,9 @@ static void BM_SM50_device_plus_multiplies_dsrgemm_tt_n_32x32x8_16x32x1_4x4_4x8_ using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -629,9 +629,9 @@ static void BM_SM50_device_plus_multiplies_dsrgemm_tt_n_64x32x8_32x32x1_8x4_4x8_ using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = 
Config::MultiplicationOp; @@ -679,9 +679,9 @@ static void BM_SM50_device_plus_multiplies_dsrgemm_tt_n_16x32x8_8x16x1_2x2_4x8_2 using WarpShape = cutlass::gemm::GemmShape<8, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -729,9 +729,9 @@ static void BM_SM50_device_plus_multiplies_dsrgemm_tt_n_16x64x8_8x32x1_2x4_4x8_2 using WarpShape = cutlass::gemm::GemmShape<8, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -779,9 +779,9 @@ static void BM_SM50_device_plus_multiplies_dsrgemm_tt_n_32x32x8_16x16x1_4x2_4x8_ using WarpShape = cutlass::gemm::GemmShape<16, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -829,9 +829,9 @@ static void 
BM_SM50_device_plus_multiplies_dsrgemm_tt_n_32x64x8_16x32x1_4x4_4x8_ using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -879,9 +879,9 @@ static void BM_SM50_device_plus_multiplies_dsrgemm_tt_n_32x128x8_16x64x1_4x8_4x8 using WarpShape = cutlass::gemm::GemmShape<16, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -929,9 +929,9 @@ static void BM_SM50_device_plus_multiplies_dsrgemm_tt_n_64x32x8_32x16x1_4x4_8x4_ using WarpShape = cutlass::gemm::GemmShape<32, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -979,9 +979,9 @@ static void 
BM_SM50_device_plus_multiplies_dsrgemm_tt_n_64x64x8_32x32x1_8x4_4x8_ using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1029,9 +1029,9 @@ static void BM_SM50_device_plus_multiplies_dsrgemm_tt_n_128x32x8_64x16x1_8x4_8x4 using WarpShape = cutlass::gemm::GemmShape<64, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1079,9 +1079,9 @@ static void BM_SM50_device_plus_multiplies_dsrgemm_tt_n_16x64x16_8x16x1_2x2_4x8_ using WarpShape = cutlass::gemm::GemmShape<8, 16, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1129,9 +1129,9 @@ static void 
BM_SM50_device_plus_multiplies_dsrgemm_tt_n_16x128x16_8x32x1_2x4_4x8 using WarpShape = cutlass::gemm::GemmShape<8, 32, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1179,9 +1179,9 @@ static void BM_SM50_device_plus_multiplies_dsrgemm_tt_n_32x32x8_16x8x1_2x2_8x4_2 using WarpShape = cutlass::gemm::GemmShape<16, 8, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1229,9 +1229,9 @@ static void BM_SM50_device_plus_multiplies_dsrgemm_tt_n_32x64x8_16x16x1_4x2_4x8_ using WarpShape = cutlass::gemm::GemmShape<16, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1279,9 +1279,9 @@ static void 
BM_SM50_device_plus_multiplies_dsrgemm_tt_n_32x128x8_16x32x1_4x4_4x8 using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1329,9 +1329,9 @@ static void BM_SM50_device_plus_multiplies_dsrgemm_tt_n_64x64x8_32x16x1_4x4_8x4_ using WarpShape = cutlass::gemm::GemmShape<32, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1379,9 +1379,9 @@ static void BM_SM50_device_plus_multiplies_dsrgemm_tt_n_32x32x8_8x16x1_2x2_4x8_4 using WarpShape = cutlass::gemm::GemmShape<8, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1429,9 +1429,9 @@ static void 
BM_SM50_device_plus_multiplies_dsrgemm_tt_n_64x32x8_16x16x1_4x2_4x8_ using WarpShape = cutlass::gemm::GemmShape<16, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1479,9 +1479,9 @@ static void BM_SM50_device_plus_multiplies_dsrgemm_tt_n_64x64x8_16x32x1_4x4_4x8_ using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1529,9 +1529,9 @@ static void BM_SM50_device_plus_multiplies_dsrgemm_tt_n_128x32x8_32x16x1_4x4_8x4 using WarpShape = cutlass::gemm::GemmShape<32, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1579,9 +1579,9 @@ static void 
BM_SM50_device_plus_multiplies_dsrgemm_tt_n_32x64x16_8x16x1_2x2_4x8_ using WarpShape = cutlass::gemm::GemmShape<8, 16, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1629,9 +1629,9 @@ static void BM_SM50_device_plus_multiplies_dsrgemm_tt_n_32x128x16_8x32x1_2x4_4x8 using WarpShape = cutlass::gemm::GemmShape<8, 32, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1679,9 +1679,9 @@ static void BM_SM50_device_plus_multiplies_dsrgemm_tt_n_64x32x16_16x8x1_2x2_8x4_ using WarpShape = cutlass::gemm::GemmShape<16, 8, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1729,9 +1729,9 @@ static void 
BM_SM50_device_plus_multiplies_dsrgemm_tt_n_64x64x8_16x16x1_4x2_4x8_ using WarpShape = cutlass::gemm::GemmShape<16, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1779,9 +1779,9 @@ static void BM_SM50_device_plus_multiplies_dsrgemm_tt_n_128x32x16_32x8x1_4x2_8x4 using WarpShape = cutlass::gemm::GemmShape<32, 8, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; diff --git a/bench/device/sm50_simt_plus_multiplies_dsrgemm_tt_t.cu b/bench/device/sm50_simt_plus_multiplies_dsrgemm_tt_t.cu index 2cb9c1a..c6a4482 100644 --- a/bench/device/sm50_simt_plus_multiplies_dsrgemm_tt_t.cu +++ b/bench/device/sm50_simt_plus_multiplies_dsrgemm_tt_t.cu @@ -29,9 +29,9 @@ static void BM_SM50_device_plus_multiplies_dsrgemm_tt_t_8x32x8_8x32x1_2x4_4x8_1x using WarpShape = cutlass::gemm::GemmShape<8, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename 
cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -79,9 +79,9 @@ static void BM_SM50_device_plus_multiplies_dsrgemm_tt_t_16x32x8_16x32x1_4x4_4x8_ using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -129,9 +129,9 @@ static void BM_SM50_device_plus_multiplies_dsrgemm_tt_t_16x64x8_16x64x1_4x8_4x8_ using WarpShape = cutlass::gemm::GemmShape<16, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -179,9 +179,9 @@ static void BM_SM50_device_plus_multiplies_dsrgemm_tt_t_32x32x8_32x32x1_8x4_4x8_ using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + 
precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -229,9 +229,9 @@ static void BM_SM50_device_plus_multiplies_dsrgemm_tt_t_8x32x8_8x16x1_2x2_4x8_1x using WarpShape = cutlass::gemm::GemmShape<8, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -279,9 +279,9 @@ static void BM_SM50_device_plus_multiplies_dsrgemm_tt_t_8x64x8_8x32x1_2x4_4x8_1x using WarpShape = cutlass::gemm::GemmShape<8, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -329,9 +329,9 @@ static void BM_SM50_device_plus_multiplies_dsrgemm_tt_t_16x32x8_16x16x1_4x2_4x8_ using WarpShape = cutlass::gemm::GemmShape<16, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, 
cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -379,9 +379,9 @@ static void BM_SM50_device_plus_multiplies_dsrgemm_tt_t_16x64x8_16x32x1_4x4_4x8_ using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -429,9 +429,9 @@ static void BM_SM50_device_plus_multiplies_dsrgemm_tt_t_16x128x8_16x64x1_4x8_4x8 using WarpShape = cutlass::gemm::GemmShape<16, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -479,9 +479,9 @@ static void BM_SM50_device_plus_multiplies_dsrgemm_tt_t_32x32x8_32x16x1_4x4_8x4_ using WarpShape = cutlass::gemm::GemmShape<32, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = 
Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -529,9 +529,9 @@ static void BM_SM50_device_plus_multiplies_dsrgemm_tt_t_32x64x8_32x32x1_8x4_4x8_ using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -579,9 +579,9 @@ static void BM_SM50_device_plus_multiplies_dsrgemm_tt_t_32x32x8_16x32x1_4x4_4x8_ using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -629,9 +629,9 @@ static void BM_SM50_device_plus_multiplies_dsrgemm_tt_t_64x32x8_32x32x1_8x4_4x8_ using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = 
Config::MultiplicationOp; @@ -679,9 +679,9 @@ static void BM_SM50_device_plus_multiplies_dsrgemm_tt_t_16x32x8_8x16x1_2x2_4x8_2 using WarpShape = cutlass::gemm::GemmShape<8, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -729,9 +729,9 @@ static void BM_SM50_device_plus_multiplies_dsrgemm_tt_t_16x64x8_8x32x1_2x4_4x8_2 using WarpShape = cutlass::gemm::GemmShape<8, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -779,9 +779,9 @@ static void BM_SM50_device_plus_multiplies_dsrgemm_tt_t_32x32x8_16x16x1_4x2_4x8_ using WarpShape = cutlass::gemm::GemmShape<16, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -829,9 +829,9 @@ static void 
BM_SM50_device_plus_multiplies_dsrgemm_tt_t_32x64x8_16x32x1_4x4_4x8_ using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -879,9 +879,9 @@ static void BM_SM50_device_plus_multiplies_dsrgemm_tt_t_32x128x8_16x64x1_4x8_4x8 using WarpShape = cutlass::gemm::GemmShape<16, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -929,9 +929,9 @@ static void BM_SM50_device_plus_multiplies_dsrgemm_tt_t_64x32x8_32x16x1_4x4_8x4_ using WarpShape = cutlass::gemm::GemmShape<32, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -979,9 +979,9 @@ static void 
BM_SM50_device_plus_multiplies_dsrgemm_tt_t_64x64x8_32x32x1_8x4_4x8_ using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1029,9 +1029,9 @@ static void BM_SM50_device_plus_multiplies_dsrgemm_tt_t_128x32x8_64x16x1_8x4_8x4 using WarpShape = cutlass::gemm::GemmShape<64, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1079,9 +1079,9 @@ static void BM_SM50_device_plus_multiplies_dsrgemm_tt_t_16x64x16_8x16x1_2x2_4x8_ using WarpShape = cutlass::gemm::GemmShape<8, 16, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1129,9 +1129,9 @@ static void 
BM_SM50_device_plus_multiplies_dsrgemm_tt_t_16x128x16_8x32x1_2x4_4x8 using WarpShape = cutlass::gemm::GemmShape<8, 32, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1179,9 +1179,9 @@ static void BM_SM50_device_plus_multiplies_dsrgemm_tt_t_32x32x8_16x8x1_2x2_8x4_2 using WarpShape = cutlass::gemm::GemmShape<16, 8, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1229,9 +1229,9 @@ static void BM_SM50_device_plus_multiplies_dsrgemm_tt_t_32x64x8_16x16x1_4x2_4x8_ using WarpShape = cutlass::gemm::GemmShape<16, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1279,9 +1279,9 @@ static void 
BM_SM50_device_plus_multiplies_dsrgemm_tt_t_32x128x8_16x32x1_4x4_4x8 using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1329,9 +1329,9 @@ static void BM_SM50_device_plus_multiplies_dsrgemm_tt_t_64x64x8_32x16x1_4x4_8x4_ using WarpShape = cutlass::gemm::GemmShape<32, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1379,9 +1379,9 @@ static void BM_SM50_device_plus_multiplies_dsrgemm_tt_t_32x32x8_8x16x1_2x2_4x8_4 using WarpShape = cutlass::gemm::GemmShape<8, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1429,9 +1429,9 @@ static void 
BM_SM50_device_plus_multiplies_dsrgemm_tt_t_64x32x8_16x16x1_4x2_4x8_ using WarpShape = cutlass::gemm::GemmShape<16, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1479,9 +1479,9 @@ static void BM_SM50_device_plus_multiplies_dsrgemm_tt_t_64x64x8_16x32x1_4x4_4x8_ using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1529,9 +1529,9 @@ static void BM_SM50_device_plus_multiplies_dsrgemm_tt_t_128x32x8_32x16x1_4x4_8x4 using WarpShape = cutlass::gemm::GemmShape<32, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1579,9 +1579,9 @@ static void 
BM_SM50_device_plus_multiplies_dsrgemm_tt_t_32x64x16_8x16x1_2x2_4x8_ using WarpShape = cutlass::gemm::GemmShape<8, 16, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1629,9 +1629,9 @@ static void BM_SM50_device_plus_multiplies_dsrgemm_tt_t_32x128x16_8x32x1_2x4_4x8 using WarpShape = cutlass::gemm::GemmShape<8, 32, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1679,9 +1679,9 @@ static void BM_SM50_device_plus_multiplies_dsrgemm_tt_t_64x32x16_16x8x1_2x2_8x4_ using WarpShape = cutlass::gemm::GemmShape<16, 8, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1729,9 +1729,9 @@ static void 
BM_SM50_device_plus_multiplies_dsrgemm_tt_t_64x64x8_16x16x1_4x2_4x8_ using WarpShape = cutlass::gemm::GemmShape<16, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1779,9 +1779,9 @@ static void BM_SM50_device_plus_multiplies_dsrgemm_tt_t_128x32x16_32x8x1_4x2_8x4 using WarpShape = cutlass::gemm::GemmShape<32, 8, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; diff --git a/bench/device/sm50_simt_plus_multiplies_ssrgemm_nn_n.cu b/bench/device/sm50_simt_plus_multiplies_ssrgemm_nn_n.cu index d6d2dbb..45e77d2 100644 --- a/bench/device/sm50_simt_plus_multiplies_ssrgemm_nn_n.cu +++ b/bench/device/sm50_simt_plus_multiplies_ssrgemm_nn_n.cu @@ -29,9 +29,9 @@ static void BM_SM50_device_plus_multiplies_ssrgemm_nn_n_8x32x8_8x32x1_2x4_4x8_1x using WarpShape = cutlass::gemm::GemmShape<8, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename 
cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -79,9 +79,9 @@ static void BM_SM50_device_plus_multiplies_ssrgemm_nn_n_16x32x8_16x32x1_4x4_4x8_ using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -129,9 +129,9 @@ static void BM_SM50_device_plus_multiplies_ssrgemm_nn_n_16x64x8_16x64x1_4x8_4x8_ using WarpShape = cutlass::gemm::GemmShape<16, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -179,9 +179,9 @@ static void BM_SM50_device_plus_multiplies_ssrgemm_nn_n_32x32x8_32x32x1_8x4_4x8_ using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + 
precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -229,9 +229,9 @@ static void BM_SM50_device_plus_multiplies_ssrgemm_nn_n_32x64x8_32x64x1_8x8_4x8_ using WarpShape = cutlass::gemm::GemmShape<32, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -279,9 +279,9 @@ static void BM_SM50_device_plus_multiplies_ssrgemm_nn_n_64x32x8_64x32x1_8x8_8x4_ using WarpShape = cutlass::gemm::GemmShape<64, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -329,9 +329,9 @@ static void BM_SM50_device_plus_multiplies_ssrgemm_nn_n_8x32x8_8x16x1_2x2_4x8_1x using WarpShape = cutlass::gemm::GemmShape<8, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, 
cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -379,9 +379,9 @@ static void BM_SM50_device_plus_multiplies_ssrgemm_nn_n_8x64x8_8x32x1_2x4_4x8_1x using WarpShape = cutlass::gemm::GemmShape<8, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -429,9 +429,9 @@ static void BM_SM50_device_plus_multiplies_ssrgemm_nn_n_16x32x8_16x16x1_4x2_4x8_ using WarpShape = cutlass::gemm::GemmShape<16, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -479,9 +479,9 @@ static void BM_SM50_device_plus_multiplies_ssrgemm_nn_n_16x64x8_16x32x1_4x4_4x8_ using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = 
Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -529,9 +529,9 @@ static void BM_SM50_device_plus_multiplies_ssrgemm_nn_n_16x128x8_16x64x1_4x8_4x8 using WarpShape = cutlass::gemm::GemmShape<16, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -579,9 +579,9 @@ static void BM_SM50_device_plus_multiplies_ssrgemm_nn_n_32x32x8_32x16x1_4x4_8x4_ using WarpShape = cutlass::gemm::GemmShape<32, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -629,9 +629,9 @@ static void BM_SM50_device_plus_multiplies_ssrgemm_nn_n_32x64x8_32x32x1_8x4_4x8_ using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = 
Config::MultiplicationOp; @@ -679,9 +679,9 @@ static void BM_SM50_device_plus_multiplies_ssrgemm_nn_n_32x128x8_32x64x1_8x8_4x8 using WarpShape = cutlass::gemm::GemmShape<32, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -729,9 +729,9 @@ static void BM_SM50_device_plus_multiplies_ssrgemm_nn_n_64x64x8_64x32x1_8x8_8x4_ using WarpShape = cutlass::gemm::GemmShape<64, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -779,9 +779,9 @@ static void BM_SM50_device_plus_multiplies_ssrgemm_nn_n_32x32x8_16x32x1_4x4_4x8_ using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -829,9 +829,9 @@ static void 
BM_SM50_device_plus_multiplies_ssrgemm_nn_n_64x32x8_32x32x1_8x4_4x8_ using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -879,9 +879,9 @@ static void BM_SM50_device_plus_multiplies_ssrgemm_nn_n_64x64x8_32x64x1_8x8_4x8_ using WarpShape = cutlass::gemm::GemmShape<32, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -929,9 +929,9 @@ static void BM_SM50_device_plus_multiplies_ssrgemm_nn_n_128x32x8_64x32x1_8x8_8x4 using WarpShape = cutlass::gemm::GemmShape<64, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -979,9 +979,9 @@ static void 
BM_SM50_device_plus_multiplies_ssrgemm_nn_n_16x32x8_8x16x1_2x2_4x8_2 using WarpShape = cutlass::gemm::GemmShape<8, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1029,9 +1029,9 @@ static void BM_SM50_device_plus_multiplies_ssrgemm_nn_n_16x64x8_8x32x1_2x4_4x8_2 using WarpShape = cutlass::gemm::GemmShape<8, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1079,9 +1079,9 @@ static void BM_SM50_device_plus_multiplies_ssrgemm_nn_n_32x32x8_16x16x1_4x2_4x8_ using WarpShape = cutlass::gemm::GemmShape<16, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1129,9 +1129,9 @@ static void 
BM_SM50_device_plus_multiplies_ssrgemm_nn_n_32x64x8_16x32x1_4x4_4x8_ using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1179,9 +1179,9 @@ static void BM_SM50_device_plus_multiplies_ssrgemm_nn_n_32x128x8_16x64x1_4x8_4x8 using WarpShape = cutlass::gemm::GemmShape<16, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1229,9 +1229,9 @@ static void BM_SM50_device_plus_multiplies_ssrgemm_nn_n_64x32x8_32x16x1_4x4_8x4_ using WarpShape = cutlass::gemm::GemmShape<32, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1279,9 +1279,9 @@ static void 
BM_SM50_device_plus_multiplies_ssrgemm_nn_n_64x64x8_32x32x1_8x4_4x8_ using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1329,9 +1329,9 @@ static void BM_SM50_device_plus_multiplies_ssrgemm_nn_n_64x128x8_32x64x1_8x8_4x8 using WarpShape = cutlass::gemm::GemmShape<32, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1379,9 +1379,9 @@ static void BM_SM50_device_plus_multiplies_ssrgemm_nn_n_128x32x8_64x16x1_8x4_8x4 using WarpShape = cutlass::gemm::GemmShape<64, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1429,9 +1429,9 @@ static void 
BM_SM50_device_plus_multiplies_ssrgemm_nn_n_128x64x8_64x32x1_8x8_8x4 using WarpShape = cutlass::gemm::GemmShape<64, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1479,9 +1479,9 @@ static void BM_SM50_device_plus_multiplies_ssrgemm_nn_n_16x64x16_8x16x1_2x2_4x8_ using WarpShape = cutlass::gemm::GemmShape<8, 16, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1529,9 +1529,9 @@ static void BM_SM50_device_plus_multiplies_ssrgemm_nn_n_16x128x16_8x32x1_2x4_4x8 using WarpShape = cutlass::gemm::GemmShape<8, 32, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1579,9 +1579,9 @@ static void 
BM_SM50_device_plus_multiplies_ssrgemm_nn_n_32x32x8_16x8x1_2x2_8x4_2 using WarpShape = cutlass::gemm::GemmShape<16, 8, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1629,9 +1629,9 @@ static void BM_SM50_device_plus_multiplies_ssrgemm_nn_n_32x64x8_16x16x1_4x2_4x8_ using WarpShape = cutlass::gemm::GemmShape<16, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1679,9 +1679,9 @@ static void BM_SM50_device_plus_multiplies_ssrgemm_nn_n_32x128x8_16x32x1_4x4_4x8 using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1729,9 +1729,9 @@ static void 
BM_SM50_device_plus_multiplies_ssrgemm_nn_n_32x256x8_16x64x1_4x8_4x8 using WarpShape = cutlass::gemm::GemmShape<16, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1779,9 +1779,9 @@ static void BM_SM50_device_plus_multiplies_ssrgemm_nn_n_64x64x8_32x16x1_4x4_8x4_ using WarpShape = cutlass::gemm::GemmShape<32, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1829,9 +1829,9 @@ static void BM_SM50_device_plus_multiplies_ssrgemm_nn_n_64x128x8_32x32x1_8x4_4x8 using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1879,9 +1879,9 @@ static void 
BM_SM50_device_plus_multiplies_ssrgemm_nn_n_64x256x8_32x64x1_8x8_4x8 using WarpShape = cutlass::gemm::GemmShape<32, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1929,9 +1929,9 @@ static void BM_SM50_device_plus_multiplies_ssrgemm_nn_n_128x128x8_64x32x1_8x8_8x using WarpShape = cutlass::gemm::GemmShape<64, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1979,9 +1979,9 @@ static void BM_SM50_device_plus_multiplies_ssrgemm_nn_n_32x32x8_8x16x1_2x2_4x8_4 using WarpShape = cutlass::gemm::GemmShape<8, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -2029,9 +2029,9 @@ static void 
BM_SM50_device_plus_multiplies_ssrgemm_nn_n_64x32x8_16x16x1_4x2_4x8_ using WarpShape = cutlass::gemm::GemmShape<16, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -2079,9 +2079,9 @@ static void BM_SM50_device_plus_multiplies_ssrgemm_nn_n_64x64x8_16x32x1_4x4_4x8_ using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -2129,9 +2129,9 @@ static void BM_SM50_device_plus_multiplies_ssrgemm_nn_n_128x32x8_32x16x1_4x4_8x4 using WarpShape = cutlass::gemm::GemmShape<32, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -2179,9 +2179,9 @@ static void 
BM_SM50_device_plus_multiplies_ssrgemm_nn_n_128x64x8_32x32x1_8x4_4x8 using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -2229,9 +2229,9 @@ static void BM_SM50_device_plus_multiplies_ssrgemm_nn_n_128x128x8_32x64x1_8x8_4x using WarpShape = cutlass::gemm::GemmShape<32, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -2279,9 +2279,9 @@ static void BM_SM50_device_plus_multiplies_ssrgemm_nn_n_256x32x8_64x16x1_8x4_8x4 using WarpShape = cutlass::gemm::GemmShape<64, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -2329,9 +2329,9 @@ static void 
BM_SM50_device_plus_multiplies_ssrgemm_nn_n_256x64x8_64x32x1_8x8_8x4 using WarpShape = cutlass::gemm::GemmShape<64, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -2379,9 +2379,9 @@ static void BM_SM50_device_plus_multiplies_ssrgemm_nn_n_32x64x16_8x16x1_2x2_4x8_ using WarpShape = cutlass::gemm::GemmShape<8, 16, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -2429,9 +2429,9 @@ static void BM_SM50_device_plus_multiplies_ssrgemm_nn_n_32x128x16_8x32x1_2x4_4x8 using WarpShape = cutlass::gemm::GemmShape<8, 32, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -2479,9 +2479,9 @@ static void 
BM_SM50_device_plus_multiplies_ssrgemm_nn_n_64x32x16_16x8x1_2x2_8x4_ using WarpShape = cutlass::gemm::GemmShape<16, 8, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -2529,9 +2529,9 @@ static void BM_SM50_device_plus_multiplies_ssrgemm_nn_n_64x64x8_16x16x1_4x2_4x8_ using WarpShape = cutlass::gemm::GemmShape<16, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -2579,9 +2579,9 @@ static void BM_SM50_device_plus_multiplies_ssrgemm_nn_n_64x128x8_16x32x1_4x4_4x8 using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -2629,9 +2629,9 @@ static void 
BM_SM50_device_plus_multiplies_ssrgemm_nn_n_64x256x8_16x64x1_4x8_4x8 using WarpShape = cutlass::gemm::GemmShape<16, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -2679,9 +2679,9 @@ static void BM_SM50_device_plus_multiplies_ssrgemm_nn_n_128x32x16_32x8x1_4x2_8x4 using WarpShape = cutlass::gemm::GemmShape<32, 8, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -2729,9 +2729,9 @@ static void BM_SM50_device_plus_multiplies_ssrgemm_nn_n_128x64x8_32x16x1_4x4_8x4 using WarpShape = cutlass::gemm::GemmShape<32, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -2779,9 +2779,9 @@ static void 
BM_SM50_device_plus_multiplies_ssrgemm_nn_n_128x128x8_32x32x1_8x4_4x using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -2829,9 +2829,9 @@ static void BM_SM50_device_plus_multiplies_ssrgemm_nn_n_256x64x8_64x16x1_8x4_8x4 using WarpShape = cutlass::gemm::GemmShape<64, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; diff --git a/bench/device/sm50_simt_plus_multiplies_ssrgemm_nn_t.cu b/bench/device/sm50_simt_plus_multiplies_ssrgemm_nn_t.cu index 1ad881f..c6a3ed6 100644 --- a/bench/device/sm50_simt_plus_multiplies_ssrgemm_nn_t.cu +++ b/bench/device/sm50_simt_plus_multiplies_ssrgemm_nn_t.cu @@ -29,9 +29,9 @@ static void BM_SM50_device_plus_multiplies_ssrgemm_nn_t_8x32x8_8x32x1_2x4_4x8_1x using WarpShape = cutlass::gemm::GemmShape<8, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename 
cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -79,9 +79,9 @@ static void BM_SM50_device_plus_multiplies_ssrgemm_nn_t_16x32x8_16x32x1_4x4_4x8_ using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -129,9 +129,9 @@ static void BM_SM50_device_plus_multiplies_ssrgemm_nn_t_16x64x8_16x64x1_4x8_4x8_ using WarpShape = cutlass::gemm::GemmShape<16, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -179,9 +179,9 @@ static void BM_SM50_device_plus_multiplies_ssrgemm_nn_t_32x32x8_32x32x1_8x4_4x8_ using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + 
precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -229,9 +229,9 @@ static void BM_SM50_device_plus_multiplies_ssrgemm_nn_t_32x64x8_32x64x1_8x8_4x8_ using WarpShape = cutlass::gemm::GemmShape<32, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -279,9 +279,9 @@ static void BM_SM50_device_plus_multiplies_ssrgemm_nn_t_64x32x8_64x32x1_8x8_8x4_ using WarpShape = cutlass::gemm::GemmShape<64, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -329,9 +329,9 @@ static void BM_SM50_device_plus_multiplies_ssrgemm_nn_t_8x32x8_8x16x1_2x2_4x8_1x using WarpShape = cutlass::gemm::GemmShape<8, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, 
cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -379,9 +379,9 @@ static void BM_SM50_device_plus_multiplies_ssrgemm_nn_t_8x64x8_8x32x1_2x4_4x8_1x using WarpShape = cutlass::gemm::GemmShape<8, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -429,9 +429,9 @@ static void BM_SM50_device_plus_multiplies_ssrgemm_nn_t_16x32x8_16x16x1_4x2_4x8_ using WarpShape = cutlass::gemm::GemmShape<16, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -479,9 +479,9 @@ static void BM_SM50_device_plus_multiplies_ssrgemm_nn_t_16x64x8_16x32x1_4x4_4x8_ using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = 
Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -529,9 +529,9 @@ static void BM_SM50_device_plus_multiplies_ssrgemm_nn_t_16x128x8_16x64x1_4x8_4x8 using WarpShape = cutlass::gemm::GemmShape<16, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -579,9 +579,9 @@ static void BM_SM50_device_plus_multiplies_ssrgemm_nn_t_32x32x8_32x16x1_4x4_8x4_ using WarpShape = cutlass::gemm::GemmShape<32, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -629,9 +629,9 @@ static void BM_SM50_device_plus_multiplies_ssrgemm_nn_t_32x64x8_32x32x1_8x4_4x8_ using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = 
Config::MultiplicationOp; @@ -679,9 +679,9 @@ static void BM_SM50_device_plus_multiplies_ssrgemm_nn_t_32x128x8_32x64x1_8x8_4x8 using WarpShape = cutlass::gemm::GemmShape<32, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -729,9 +729,9 @@ static void BM_SM50_device_plus_multiplies_ssrgemm_nn_t_64x64x8_64x32x1_8x8_8x4_ using WarpShape = cutlass::gemm::GemmShape<64, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -779,9 +779,9 @@ static void BM_SM50_device_plus_multiplies_ssrgemm_nn_t_32x32x8_16x32x1_4x4_4x8_ using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -829,9 +829,9 @@ static void 
BM_SM50_device_plus_multiplies_ssrgemm_nn_t_64x32x8_32x32x1_8x4_4x8_ using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -879,9 +879,9 @@ static void BM_SM50_device_plus_multiplies_ssrgemm_nn_t_64x64x8_32x64x1_8x8_4x8_ using WarpShape = cutlass::gemm::GemmShape<32, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -929,9 +929,9 @@ static void BM_SM50_device_plus_multiplies_ssrgemm_nn_t_128x32x8_64x32x1_8x8_8x4 using WarpShape = cutlass::gemm::GemmShape<64, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -979,9 +979,9 @@ static void 
BM_SM50_device_plus_multiplies_ssrgemm_nn_t_16x32x8_8x16x1_2x2_4x8_2 using WarpShape = cutlass::gemm::GemmShape<8, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1029,9 +1029,9 @@ static void BM_SM50_device_plus_multiplies_ssrgemm_nn_t_16x64x8_8x32x1_2x4_4x8_2 using WarpShape = cutlass::gemm::GemmShape<8, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1079,9 +1079,9 @@ static void BM_SM50_device_plus_multiplies_ssrgemm_nn_t_32x32x8_16x16x1_4x2_4x8_ using WarpShape = cutlass::gemm::GemmShape<16, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1129,9 +1129,9 @@ static void 
BM_SM50_device_plus_multiplies_ssrgemm_nn_t_32x64x8_16x32x1_4x4_4x8_ using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1179,9 +1179,9 @@ static void BM_SM50_device_plus_multiplies_ssrgemm_nn_t_32x128x8_16x64x1_4x8_4x8 using WarpShape = cutlass::gemm::GemmShape<16, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1229,9 +1229,9 @@ static void BM_SM50_device_plus_multiplies_ssrgemm_nn_t_64x32x8_32x16x1_4x4_8x4_ using WarpShape = cutlass::gemm::GemmShape<32, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1279,9 +1279,9 @@ static void 
BM_SM50_device_plus_multiplies_ssrgemm_nn_t_64x64x8_32x32x1_8x4_4x8_ using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1329,9 +1329,9 @@ static void BM_SM50_device_plus_multiplies_ssrgemm_nn_t_64x128x8_32x64x1_8x8_4x8 using WarpShape = cutlass::gemm::GemmShape<32, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1379,9 +1379,9 @@ static void BM_SM50_device_plus_multiplies_ssrgemm_nn_t_128x32x8_64x16x1_8x4_8x4 using WarpShape = cutlass::gemm::GemmShape<64, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1429,9 +1429,9 @@ static void 
BM_SM50_device_plus_multiplies_ssrgemm_nn_t_128x64x8_64x32x1_8x8_8x4 using WarpShape = cutlass::gemm::GemmShape<64, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1479,9 +1479,9 @@ static void BM_SM50_device_plus_multiplies_ssrgemm_nn_t_16x64x16_8x16x1_2x2_4x8_ using WarpShape = cutlass::gemm::GemmShape<8, 16, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1529,9 +1529,9 @@ static void BM_SM50_device_plus_multiplies_ssrgemm_nn_t_16x128x16_8x32x1_2x4_4x8 using WarpShape = cutlass::gemm::GemmShape<8, 32, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1579,9 +1579,9 @@ static void 
BM_SM50_device_plus_multiplies_ssrgemm_nn_t_32x32x8_16x8x1_2x2_8x4_2 using WarpShape = cutlass::gemm::GemmShape<16, 8, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1629,9 +1629,9 @@ static void BM_SM50_device_plus_multiplies_ssrgemm_nn_t_32x64x8_16x16x1_4x2_4x8_ using WarpShape = cutlass::gemm::GemmShape<16, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1679,9 +1679,9 @@ static void BM_SM50_device_plus_multiplies_ssrgemm_nn_t_32x128x8_16x32x1_4x4_4x8 using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1729,9 +1729,9 @@ static void 
BM_SM50_device_plus_multiplies_ssrgemm_nn_t_32x256x8_16x64x1_4x8_4x8 using WarpShape = cutlass::gemm::GemmShape<16, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1779,9 +1779,9 @@ static void BM_SM50_device_plus_multiplies_ssrgemm_nn_t_64x64x8_32x16x1_4x4_8x4_ using WarpShape = cutlass::gemm::GemmShape<32, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1829,9 +1829,9 @@ static void BM_SM50_device_plus_multiplies_ssrgemm_nn_t_64x128x8_32x32x1_8x4_4x8 using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1879,9 +1879,9 @@ static void 
BM_SM50_device_plus_multiplies_ssrgemm_nn_t_64x256x8_32x64x1_8x8_4x8 using WarpShape = cutlass::gemm::GemmShape<32, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1929,9 +1929,9 @@ static void BM_SM50_device_plus_multiplies_ssrgemm_nn_t_128x128x8_64x32x1_8x8_8x using WarpShape = cutlass::gemm::GemmShape<64, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1979,9 +1979,9 @@ static void BM_SM50_device_plus_multiplies_ssrgemm_nn_t_32x32x8_8x16x1_2x2_4x8_4 using WarpShape = cutlass::gemm::GemmShape<8, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -2029,9 +2029,9 @@ static void 
BM_SM50_device_plus_multiplies_ssrgemm_nn_t_64x32x8_16x16x1_4x2_4x8_ using WarpShape = cutlass::gemm::GemmShape<16, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -2079,9 +2079,9 @@ static void BM_SM50_device_plus_multiplies_ssrgemm_nn_t_64x64x8_16x32x1_4x4_4x8_ using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -2129,9 +2129,9 @@ static void BM_SM50_device_plus_multiplies_ssrgemm_nn_t_128x32x8_32x16x1_4x4_8x4 using WarpShape = cutlass::gemm::GemmShape<32, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -2179,9 +2179,9 @@ static void 
BM_SM50_device_plus_multiplies_ssrgemm_nn_t_128x64x8_32x32x1_8x4_4x8 using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -2229,9 +2229,9 @@ static void BM_SM50_device_plus_multiplies_ssrgemm_nn_t_128x128x8_32x64x1_8x8_4x using WarpShape = cutlass::gemm::GemmShape<32, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -2279,9 +2279,9 @@ static void BM_SM50_device_plus_multiplies_ssrgemm_nn_t_256x32x8_64x16x1_8x4_8x4 using WarpShape = cutlass::gemm::GemmShape<64, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -2329,9 +2329,9 @@ static void 
BM_SM50_device_plus_multiplies_ssrgemm_nn_t_256x64x8_64x32x1_8x8_8x4 using WarpShape = cutlass::gemm::GemmShape<64, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -2379,9 +2379,9 @@ static void BM_SM50_device_plus_multiplies_ssrgemm_nn_t_32x64x16_8x16x1_2x2_4x8_ using WarpShape = cutlass::gemm::GemmShape<8, 16, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -2429,9 +2429,9 @@ static void BM_SM50_device_plus_multiplies_ssrgemm_nn_t_32x128x16_8x32x1_2x4_4x8 using WarpShape = cutlass::gemm::GemmShape<8, 32, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -2479,9 +2479,9 @@ static void 
BM_SM50_device_plus_multiplies_ssrgemm_nn_t_64x32x16_16x8x1_2x2_8x4_ using WarpShape = cutlass::gemm::GemmShape<16, 8, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -2529,9 +2529,9 @@ static void BM_SM50_device_plus_multiplies_ssrgemm_nn_t_64x64x8_16x16x1_4x2_4x8_ using WarpShape = cutlass::gemm::GemmShape<16, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -2579,9 +2579,9 @@ static void BM_SM50_device_plus_multiplies_ssrgemm_nn_t_64x128x8_16x32x1_4x4_4x8 using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -2629,9 +2629,9 @@ static void 
BM_SM50_device_plus_multiplies_ssrgemm_nn_t_64x256x8_16x64x1_4x8_4x8 using WarpShape = cutlass::gemm::GemmShape<16, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -2679,9 +2679,9 @@ static void BM_SM50_device_plus_multiplies_ssrgemm_nn_t_128x32x16_32x8x1_4x2_8x4 using WarpShape = cutlass::gemm::GemmShape<32, 8, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -2729,9 +2729,9 @@ static void BM_SM50_device_plus_multiplies_ssrgemm_nn_t_128x64x8_32x16x1_4x4_8x4 using WarpShape = cutlass::gemm::GemmShape<32, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -2779,9 +2779,9 @@ static void 
BM_SM50_device_plus_multiplies_ssrgemm_nn_t_128x128x8_32x32x1_8x4_4x using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -2829,9 +2829,9 @@ static void BM_SM50_device_plus_multiplies_ssrgemm_nn_t_256x64x8_64x16x1_8x4_8x4 using WarpShape = cutlass::gemm::GemmShape<64, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; diff --git a/bench/device/sm50_simt_plus_multiplies_ssrgemm_nt_n.cu b/bench/device/sm50_simt_plus_multiplies_ssrgemm_nt_n.cu index f1da382..0988771 100644 --- a/bench/device/sm50_simt_plus_multiplies_ssrgemm_nt_n.cu +++ b/bench/device/sm50_simt_plus_multiplies_ssrgemm_nt_n.cu @@ -29,9 +29,9 @@ static void BM_SM50_device_plus_multiplies_ssrgemm_nt_n_8x32x8_8x32x1_2x4_4x8_1x using WarpShape = cutlass::gemm::GemmShape<8, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename 
cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -79,9 +79,9 @@ static void BM_SM50_device_plus_multiplies_ssrgemm_nt_n_16x32x8_16x32x1_4x4_4x8_ using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -129,9 +129,9 @@ static void BM_SM50_device_plus_multiplies_ssrgemm_nt_n_16x64x8_16x64x1_4x8_4x8_ using WarpShape = cutlass::gemm::GemmShape<16, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -179,9 +179,9 @@ static void BM_SM50_device_plus_multiplies_ssrgemm_nt_n_32x32x8_32x32x1_8x4_4x8_ using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + 
precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -229,9 +229,9 @@ static void BM_SM50_device_plus_multiplies_ssrgemm_nt_n_32x64x8_32x64x1_8x8_4x8_ using WarpShape = cutlass::gemm::GemmShape<32, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -279,9 +279,9 @@ static void BM_SM50_device_plus_multiplies_ssrgemm_nt_n_64x32x8_64x32x1_8x8_8x4_ using WarpShape = cutlass::gemm::GemmShape<64, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -329,9 +329,9 @@ static void BM_SM50_device_plus_multiplies_ssrgemm_nt_n_8x32x8_8x16x1_2x2_4x8_1x using WarpShape = cutlass::gemm::GemmShape<8, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, 
cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -379,9 +379,9 @@ static void BM_SM50_device_plus_multiplies_ssrgemm_nt_n_8x64x8_8x32x1_2x4_4x8_1x using WarpShape = cutlass::gemm::GemmShape<8, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -429,9 +429,9 @@ static void BM_SM50_device_plus_multiplies_ssrgemm_nt_n_16x32x8_16x16x1_4x2_4x8_ using WarpShape = cutlass::gemm::GemmShape<16, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -479,9 +479,9 @@ static void BM_SM50_device_plus_multiplies_ssrgemm_nt_n_16x64x8_16x32x1_4x4_4x8_ using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = 
Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -529,9 +529,9 @@ static void BM_SM50_device_plus_multiplies_ssrgemm_nt_n_16x128x8_16x64x1_4x8_4x8 using WarpShape = cutlass::gemm::GemmShape<16, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -579,9 +579,9 @@ static void BM_SM50_device_plus_multiplies_ssrgemm_nt_n_32x32x8_32x16x1_4x4_8x4_ using WarpShape = cutlass::gemm::GemmShape<32, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -629,9 +629,9 @@ static void BM_SM50_device_plus_multiplies_ssrgemm_nt_n_32x64x8_32x32x1_8x4_4x8_ using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = 
Config::MultiplicationOp; @@ -679,9 +679,9 @@ static void BM_SM50_device_plus_multiplies_ssrgemm_nt_n_32x128x8_32x64x1_8x8_4x8 using WarpShape = cutlass::gemm::GemmShape<32, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -729,9 +729,9 @@ static void BM_SM50_device_plus_multiplies_ssrgemm_nt_n_64x64x8_64x32x1_8x8_8x4_ using WarpShape = cutlass::gemm::GemmShape<64, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -779,9 +779,9 @@ static void BM_SM50_device_plus_multiplies_ssrgemm_nt_n_32x32x8_16x32x1_4x4_4x8_ using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -829,9 +829,9 @@ static void 
BM_SM50_device_plus_multiplies_ssrgemm_nt_n_64x32x8_32x32x1_8x4_4x8_ using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -879,9 +879,9 @@ static void BM_SM50_device_plus_multiplies_ssrgemm_nt_n_64x64x8_32x64x1_8x8_4x8_ using WarpShape = cutlass::gemm::GemmShape<32, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -929,9 +929,9 @@ static void BM_SM50_device_plus_multiplies_ssrgemm_nt_n_128x32x8_64x32x1_8x8_8x4 using WarpShape = cutlass::gemm::GemmShape<64, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -979,9 +979,9 @@ static void 
BM_SM50_device_plus_multiplies_ssrgemm_nt_n_16x32x8_8x16x1_2x2_4x8_2 using WarpShape = cutlass::gemm::GemmShape<8, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1029,9 +1029,9 @@ static void BM_SM50_device_plus_multiplies_ssrgemm_nt_n_16x64x8_8x32x1_2x4_4x8_2 using WarpShape = cutlass::gemm::GemmShape<8, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1079,9 +1079,9 @@ static void BM_SM50_device_plus_multiplies_ssrgemm_nt_n_32x32x8_16x16x1_4x2_4x8_ using WarpShape = cutlass::gemm::GemmShape<16, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1129,9 +1129,9 @@ static void 
BM_SM50_device_plus_multiplies_ssrgemm_nt_n_32x64x8_16x32x1_4x4_4x8_ using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1179,9 +1179,9 @@ static void BM_SM50_device_plus_multiplies_ssrgemm_nt_n_32x128x8_16x64x1_4x8_4x8 using WarpShape = cutlass::gemm::GemmShape<16, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1229,9 +1229,9 @@ static void BM_SM50_device_plus_multiplies_ssrgemm_nt_n_64x32x8_32x16x1_4x4_8x4_ using WarpShape = cutlass::gemm::GemmShape<32, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1279,9 +1279,9 @@ static void 
BM_SM50_device_plus_multiplies_ssrgemm_nt_n_64x64x8_32x32x1_8x4_4x8_ using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1329,9 +1329,9 @@ static void BM_SM50_device_plus_multiplies_ssrgemm_nt_n_64x128x8_32x64x1_8x8_4x8 using WarpShape = cutlass::gemm::GemmShape<32, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1379,9 +1379,9 @@ static void BM_SM50_device_plus_multiplies_ssrgemm_nt_n_128x32x8_64x16x1_8x4_8x4 using WarpShape = cutlass::gemm::GemmShape<64, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1429,9 +1429,9 @@ static void 
BM_SM50_device_plus_multiplies_ssrgemm_nt_n_128x64x8_64x32x1_8x8_8x4 using WarpShape = cutlass::gemm::GemmShape<64, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1479,9 +1479,9 @@ static void BM_SM50_device_plus_multiplies_ssrgemm_nt_n_16x64x16_8x16x1_2x2_4x8_ using WarpShape = cutlass::gemm::GemmShape<8, 16, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1529,9 +1529,9 @@ static void BM_SM50_device_plus_multiplies_ssrgemm_nt_n_16x128x16_8x32x1_2x4_4x8 using WarpShape = cutlass::gemm::GemmShape<8, 32, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1579,9 +1579,9 @@ static void 
BM_SM50_device_plus_multiplies_ssrgemm_nt_n_32x32x8_16x8x1_2x2_8x4_2 using WarpShape = cutlass::gemm::GemmShape<16, 8, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1629,9 +1629,9 @@ static void BM_SM50_device_plus_multiplies_ssrgemm_nt_n_32x64x8_16x16x1_4x2_4x8_ using WarpShape = cutlass::gemm::GemmShape<16, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1679,9 +1679,9 @@ static void BM_SM50_device_plus_multiplies_ssrgemm_nt_n_32x128x8_16x32x1_4x4_4x8 using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1729,9 +1729,9 @@ static void 
BM_SM50_device_plus_multiplies_ssrgemm_nt_n_32x256x8_16x64x1_4x8_4x8 using WarpShape = cutlass::gemm::GemmShape<16, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1779,9 +1779,9 @@ static void BM_SM50_device_plus_multiplies_ssrgemm_nt_n_64x64x8_32x16x1_4x4_8x4_ using WarpShape = cutlass::gemm::GemmShape<32, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1829,9 +1829,9 @@ static void BM_SM50_device_plus_multiplies_ssrgemm_nt_n_64x128x8_32x32x1_8x4_4x8 using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1879,9 +1879,9 @@ static void 
BM_SM50_device_plus_multiplies_ssrgemm_nt_n_64x256x8_32x64x1_8x8_4x8 using WarpShape = cutlass::gemm::GemmShape<32, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1929,9 +1929,9 @@ static void BM_SM50_device_plus_multiplies_ssrgemm_nt_n_128x128x8_64x32x1_8x8_8x using WarpShape = cutlass::gemm::GemmShape<64, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1979,9 +1979,9 @@ static void BM_SM50_device_plus_multiplies_ssrgemm_nt_n_32x32x8_8x16x1_2x2_4x8_4 using WarpShape = cutlass::gemm::GemmShape<8, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -2029,9 +2029,9 @@ static void 
BM_SM50_device_plus_multiplies_ssrgemm_nt_n_64x32x8_16x16x1_4x2_4x8_ using WarpShape = cutlass::gemm::GemmShape<16, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -2079,9 +2079,9 @@ static void BM_SM50_device_plus_multiplies_ssrgemm_nt_n_64x64x8_16x32x1_4x4_4x8_ using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -2129,9 +2129,9 @@ static void BM_SM50_device_plus_multiplies_ssrgemm_nt_n_128x32x8_32x16x1_4x4_8x4 using WarpShape = cutlass::gemm::GemmShape<32, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -2179,9 +2179,9 @@ static void 
BM_SM50_device_plus_multiplies_ssrgemm_nt_n_128x64x8_32x32x1_8x4_4x8 using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -2229,9 +2229,9 @@ static void BM_SM50_device_plus_multiplies_ssrgemm_nt_n_128x128x8_32x64x1_8x8_4x using WarpShape = cutlass::gemm::GemmShape<32, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -2279,9 +2279,9 @@ static void BM_SM50_device_plus_multiplies_ssrgemm_nt_n_256x32x8_64x16x1_8x4_8x4 using WarpShape = cutlass::gemm::GemmShape<64, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -2329,9 +2329,9 @@ static void 
BM_SM50_device_plus_multiplies_ssrgemm_nt_n_256x64x8_64x32x1_8x8_8x4 using WarpShape = cutlass::gemm::GemmShape<64, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -2379,9 +2379,9 @@ static void BM_SM50_device_plus_multiplies_ssrgemm_nt_n_32x64x16_8x16x1_2x2_4x8_ using WarpShape = cutlass::gemm::GemmShape<8, 16, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -2429,9 +2429,9 @@ static void BM_SM50_device_plus_multiplies_ssrgemm_nt_n_32x128x16_8x32x1_2x4_4x8 using WarpShape = cutlass::gemm::GemmShape<8, 32, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -2479,9 +2479,9 @@ static void 
BM_SM50_device_plus_multiplies_ssrgemm_nt_n_64x32x16_16x8x1_2x2_8x4_ using WarpShape = cutlass::gemm::GemmShape<16, 8, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -2529,9 +2529,9 @@ static void BM_SM50_device_plus_multiplies_ssrgemm_nt_n_64x64x8_16x16x1_4x2_4x8_ using WarpShape = cutlass::gemm::GemmShape<16, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -2579,9 +2579,9 @@ static void BM_SM50_device_plus_multiplies_ssrgemm_nt_n_64x128x8_16x32x1_4x4_4x8 using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -2629,9 +2629,9 @@ static void 
BM_SM50_device_plus_multiplies_ssrgemm_nt_n_64x256x8_16x64x1_4x8_4x8 using WarpShape = cutlass::gemm::GemmShape<16, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -2679,9 +2679,9 @@ static void BM_SM50_device_plus_multiplies_ssrgemm_nt_n_128x32x16_32x8x1_4x2_8x4 using WarpShape = cutlass::gemm::GemmShape<32, 8, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -2729,9 +2729,9 @@ static void BM_SM50_device_plus_multiplies_ssrgemm_nt_n_128x64x8_32x16x1_4x4_8x4 using WarpShape = cutlass::gemm::GemmShape<32, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -2779,9 +2779,9 @@ static void 
BM_SM50_device_plus_multiplies_ssrgemm_nt_n_128x128x8_32x32x1_8x4_4x using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -2829,9 +2829,9 @@ static void BM_SM50_device_plus_multiplies_ssrgemm_nt_n_256x64x8_64x16x1_8x4_8x4 using WarpShape = cutlass::gemm::GemmShape<64, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; diff --git a/bench/device/sm50_simt_plus_multiplies_ssrgemm_nt_t.cu b/bench/device/sm50_simt_plus_multiplies_ssrgemm_nt_t.cu index eece74e..35c831a 100644 --- a/bench/device/sm50_simt_plus_multiplies_ssrgemm_nt_t.cu +++ b/bench/device/sm50_simt_plus_multiplies_ssrgemm_nt_t.cu @@ -29,9 +29,9 @@ static void BM_SM50_device_plus_multiplies_ssrgemm_nt_t_8x32x8_8x32x1_2x4_4x8_1x using WarpShape = cutlass::gemm::GemmShape<8, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename 
cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -79,9 +79,9 @@ static void BM_SM50_device_plus_multiplies_ssrgemm_nt_t_16x32x8_16x32x1_4x4_4x8_ using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -129,9 +129,9 @@ static void BM_SM50_device_plus_multiplies_ssrgemm_nt_t_16x64x8_16x64x1_4x8_4x8_ using WarpShape = cutlass::gemm::GemmShape<16, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -179,9 +179,9 @@ static void BM_SM50_device_plus_multiplies_ssrgemm_nt_t_32x32x8_32x32x1_8x4_4x8_ using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + 
precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -229,9 +229,9 @@ static void BM_SM50_device_plus_multiplies_ssrgemm_nt_t_32x64x8_32x64x1_8x8_4x8_ using WarpShape = cutlass::gemm::GemmShape<32, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -279,9 +279,9 @@ static void BM_SM50_device_plus_multiplies_ssrgemm_nt_t_64x32x8_64x32x1_8x8_8x4_ using WarpShape = cutlass::gemm::GemmShape<64, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -329,9 +329,9 @@ static void BM_SM50_device_plus_multiplies_ssrgemm_nt_t_8x32x8_8x16x1_2x2_4x8_1x using WarpShape = cutlass::gemm::GemmShape<8, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, 
cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -379,9 +379,9 @@ static void BM_SM50_device_plus_multiplies_ssrgemm_nt_t_8x64x8_8x32x1_2x4_4x8_1x using WarpShape = cutlass::gemm::GemmShape<8, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -429,9 +429,9 @@ static void BM_SM50_device_plus_multiplies_ssrgemm_nt_t_16x32x8_16x16x1_4x2_4x8_ using WarpShape = cutlass::gemm::GemmShape<16, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -479,9 +479,9 @@ static void BM_SM50_device_plus_multiplies_ssrgemm_nt_t_16x64x8_16x32x1_4x4_4x8_ using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = 
Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -529,9 +529,9 @@ static void BM_SM50_device_plus_multiplies_ssrgemm_nt_t_16x128x8_16x64x1_4x8_4x8 using WarpShape = cutlass::gemm::GemmShape<16, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -579,9 +579,9 @@ static void BM_SM50_device_plus_multiplies_ssrgemm_nt_t_32x32x8_32x16x1_4x4_8x4_ using WarpShape = cutlass::gemm::GemmShape<32, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -629,9 +629,9 @@ static void BM_SM50_device_plus_multiplies_ssrgemm_nt_t_32x64x8_32x32x1_8x4_4x8_ using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = 
Config::MultiplicationOp; @@ -679,9 +679,9 @@ static void BM_SM50_device_plus_multiplies_ssrgemm_nt_t_32x128x8_32x64x1_8x8_4x8 using WarpShape = cutlass::gemm::GemmShape<32, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -729,9 +729,9 @@ static void BM_SM50_device_plus_multiplies_ssrgemm_nt_t_64x64x8_64x32x1_8x8_8x4_ using WarpShape = cutlass::gemm::GemmShape<64, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -779,9 +779,9 @@ static void BM_SM50_device_plus_multiplies_ssrgemm_nt_t_32x32x8_16x32x1_4x4_4x8_ using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -829,9 +829,9 @@ static void 
BM_SM50_device_plus_multiplies_ssrgemm_nt_t_64x32x8_32x32x1_8x4_4x8_ using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -879,9 +879,9 @@ static void BM_SM50_device_plus_multiplies_ssrgemm_nt_t_64x64x8_32x64x1_8x8_4x8_ using WarpShape = cutlass::gemm::GemmShape<32, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -929,9 +929,9 @@ static void BM_SM50_device_plus_multiplies_ssrgemm_nt_t_128x32x8_64x32x1_8x8_8x4 using WarpShape = cutlass::gemm::GemmShape<64, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -979,9 +979,9 @@ static void 
BM_SM50_device_plus_multiplies_ssrgemm_nt_t_16x32x8_8x16x1_2x2_4x8_2 using WarpShape = cutlass::gemm::GemmShape<8, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1029,9 +1029,9 @@ static void BM_SM50_device_plus_multiplies_ssrgemm_nt_t_16x64x8_8x32x1_2x4_4x8_2 using WarpShape = cutlass::gemm::GemmShape<8, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1079,9 +1079,9 @@ static void BM_SM50_device_plus_multiplies_ssrgemm_nt_t_32x32x8_16x16x1_4x2_4x8_ using WarpShape = cutlass::gemm::GemmShape<16, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1129,9 +1129,9 @@ static void 
BM_SM50_device_plus_multiplies_ssrgemm_nt_t_32x64x8_16x32x1_4x4_4x8_ using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1179,9 +1179,9 @@ static void BM_SM50_device_plus_multiplies_ssrgemm_nt_t_32x128x8_16x64x1_4x8_4x8 using WarpShape = cutlass::gemm::GemmShape<16, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1229,9 +1229,9 @@ static void BM_SM50_device_plus_multiplies_ssrgemm_nt_t_64x32x8_32x16x1_4x4_8x4_ using WarpShape = cutlass::gemm::GemmShape<32, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1279,9 +1279,9 @@ static void 
BM_SM50_device_plus_multiplies_ssrgemm_nt_t_64x64x8_32x32x1_8x4_4x8_ using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1329,9 +1329,9 @@ static void BM_SM50_device_plus_multiplies_ssrgemm_nt_t_64x128x8_32x64x1_8x8_4x8 using WarpShape = cutlass::gemm::GemmShape<32, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1379,9 +1379,9 @@ static void BM_SM50_device_plus_multiplies_ssrgemm_nt_t_128x32x8_64x16x1_8x4_8x4 using WarpShape = cutlass::gemm::GemmShape<64, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1429,9 +1429,9 @@ static void 
BM_SM50_device_plus_multiplies_ssrgemm_nt_t_128x64x8_64x32x1_8x8_8x4 using WarpShape = cutlass::gemm::GemmShape<64, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1479,9 +1479,9 @@ static void BM_SM50_device_plus_multiplies_ssrgemm_nt_t_16x64x16_8x16x1_2x2_4x8_ using WarpShape = cutlass::gemm::GemmShape<8, 16, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1529,9 +1529,9 @@ static void BM_SM50_device_plus_multiplies_ssrgemm_nt_t_16x128x16_8x32x1_2x4_4x8 using WarpShape = cutlass::gemm::GemmShape<8, 32, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1579,9 +1579,9 @@ static void 
BM_SM50_device_plus_multiplies_ssrgemm_nt_t_32x32x8_16x8x1_2x2_8x4_2 using WarpShape = cutlass::gemm::GemmShape<16, 8, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1629,9 +1629,9 @@ static void BM_SM50_device_plus_multiplies_ssrgemm_nt_t_32x64x8_16x16x1_4x2_4x8_ using WarpShape = cutlass::gemm::GemmShape<16, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1679,9 +1679,9 @@ static void BM_SM50_device_plus_multiplies_ssrgemm_nt_t_32x128x8_16x32x1_4x4_4x8 using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1729,9 +1729,9 @@ static void 
BM_SM50_device_plus_multiplies_ssrgemm_nt_t_32x256x8_16x64x1_4x8_4x8 using WarpShape = cutlass::gemm::GemmShape<16, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1779,9 +1779,9 @@ static void BM_SM50_device_plus_multiplies_ssrgemm_nt_t_64x64x8_32x16x1_4x4_8x4_ using WarpShape = cutlass::gemm::GemmShape<32, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1829,9 +1829,9 @@ static void BM_SM50_device_plus_multiplies_ssrgemm_nt_t_64x128x8_32x32x1_8x4_4x8 using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1879,9 +1879,9 @@ static void 
BM_SM50_device_plus_multiplies_ssrgemm_nt_t_64x256x8_32x64x1_8x8_4x8 using WarpShape = cutlass::gemm::GemmShape<32, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1929,9 +1929,9 @@ static void BM_SM50_device_plus_multiplies_ssrgemm_nt_t_128x128x8_64x32x1_8x8_8x using WarpShape = cutlass::gemm::GemmShape<64, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1979,9 +1979,9 @@ static void BM_SM50_device_plus_multiplies_ssrgemm_nt_t_32x32x8_8x16x1_2x2_4x8_4 using WarpShape = cutlass::gemm::GemmShape<8, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -2029,9 +2029,9 @@ static void 
BM_SM50_device_plus_multiplies_ssrgemm_nt_t_64x32x8_16x16x1_4x2_4x8_ using WarpShape = cutlass::gemm::GemmShape<16, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -2079,9 +2079,9 @@ static void BM_SM50_device_plus_multiplies_ssrgemm_nt_t_64x64x8_16x32x1_4x4_4x8_ using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -2129,9 +2129,9 @@ static void BM_SM50_device_plus_multiplies_ssrgemm_nt_t_128x32x8_32x16x1_4x4_8x4 using WarpShape = cutlass::gemm::GemmShape<32, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -2179,9 +2179,9 @@ static void 
BM_SM50_device_plus_multiplies_ssrgemm_nt_t_128x64x8_32x32x1_8x4_4x8 using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -2229,9 +2229,9 @@ static void BM_SM50_device_plus_multiplies_ssrgemm_nt_t_128x128x8_32x64x1_8x8_4x using WarpShape = cutlass::gemm::GemmShape<32, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -2279,9 +2279,9 @@ static void BM_SM50_device_plus_multiplies_ssrgemm_nt_t_256x32x8_64x16x1_8x4_8x4 using WarpShape = cutlass::gemm::GemmShape<64, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -2329,9 +2329,9 @@ static void 
BM_SM50_device_plus_multiplies_ssrgemm_nt_t_256x64x8_64x32x1_8x8_8x4 using WarpShape = cutlass::gemm::GemmShape<64, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -2379,9 +2379,9 @@ static void BM_SM50_device_plus_multiplies_ssrgemm_nt_t_32x64x16_8x16x1_2x2_4x8_ using WarpShape = cutlass::gemm::GemmShape<8, 16, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -2429,9 +2429,9 @@ static void BM_SM50_device_plus_multiplies_ssrgemm_nt_t_32x128x16_8x32x1_2x4_4x8 using WarpShape = cutlass::gemm::GemmShape<8, 32, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -2479,9 +2479,9 @@ static void 
BM_SM50_device_plus_multiplies_ssrgemm_nt_t_64x32x16_16x8x1_2x2_8x4_ using WarpShape = cutlass::gemm::GemmShape<16, 8, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -2529,9 +2529,9 @@ static void BM_SM50_device_plus_multiplies_ssrgemm_nt_t_64x64x8_16x16x1_4x2_4x8_ using WarpShape = cutlass::gemm::GemmShape<16, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -2579,9 +2579,9 @@ static void BM_SM50_device_plus_multiplies_ssrgemm_nt_t_64x128x8_16x32x1_4x4_4x8 using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -2629,9 +2629,9 @@ static void 
BM_SM50_device_plus_multiplies_ssrgemm_nt_t_64x256x8_16x64x1_4x8_4x8 using WarpShape = cutlass::gemm::GemmShape<16, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -2679,9 +2679,9 @@ static void BM_SM50_device_plus_multiplies_ssrgemm_nt_t_128x32x16_32x8x1_4x2_8x4 using WarpShape = cutlass::gemm::GemmShape<32, 8, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -2729,9 +2729,9 @@ static void BM_SM50_device_plus_multiplies_ssrgemm_nt_t_128x64x8_32x16x1_4x4_8x4 using WarpShape = cutlass::gemm::GemmShape<32, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -2779,9 +2779,9 @@ static void 
BM_SM50_device_plus_multiplies_ssrgemm_nt_t_128x128x8_32x32x1_8x4_4x using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -2829,9 +2829,9 @@ static void BM_SM50_device_plus_multiplies_ssrgemm_nt_t_256x64x8_64x16x1_8x4_8x4 using WarpShape = cutlass::gemm::GemmShape<64, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; diff --git a/bench/device/sm50_simt_plus_multiplies_ssrgemm_tn_n.cu b/bench/device/sm50_simt_plus_multiplies_ssrgemm_tn_n.cu index 31b1e5d..fb54897 100644 --- a/bench/device/sm50_simt_plus_multiplies_ssrgemm_tn_n.cu +++ b/bench/device/sm50_simt_plus_multiplies_ssrgemm_tn_n.cu @@ -29,9 +29,9 @@ static void BM_SM50_device_plus_multiplies_ssrgemm_tn_n_8x32x8_8x32x1_2x4_4x8_1x using WarpShape = cutlass::gemm::GemmShape<8, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename 
cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -79,9 +79,9 @@ static void BM_SM50_device_plus_multiplies_ssrgemm_tn_n_16x32x8_16x32x1_4x4_4x8_ using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -129,9 +129,9 @@ static void BM_SM50_device_plus_multiplies_ssrgemm_tn_n_16x64x8_16x64x1_4x8_4x8_ using WarpShape = cutlass::gemm::GemmShape<16, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -179,9 +179,9 @@ static void BM_SM50_device_plus_multiplies_ssrgemm_tn_n_32x32x8_32x32x1_8x4_4x8_ using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + 
precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -229,9 +229,9 @@ static void BM_SM50_device_plus_multiplies_ssrgemm_tn_n_32x64x8_32x64x1_8x8_4x8_ using WarpShape = cutlass::gemm::GemmShape<32, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -279,9 +279,9 @@ static void BM_SM50_device_plus_multiplies_ssrgemm_tn_n_64x32x8_64x32x1_8x8_8x4_ using WarpShape = cutlass::gemm::GemmShape<64, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -329,9 +329,9 @@ static void BM_SM50_device_plus_multiplies_ssrgemm_tn_n_8x32x8_8x16x1_2x2_4x8_1x using WarpShape = cutlass::gemm::GemmShape<8, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, 
cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -379,9 +379,9 @@ static void BM_SM50_device_plus_multiplies_ssrgemm_tn_n_8x64x8_8x32x1_2x4_4x8_1x using WarpShape = cutlass::gemm::GemmShape<8, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -429,9 +429,9 @@ static void BM_SM50_device_plus_multiplies_ssrgemm_tn_n_16x32x8_16x16x1_4x2_4x8_ using WarpShape = cutlass::gemm::GemmShape<16, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -479,9 +479,9 @@ static void BM_SM50_device_plus_multiplies_ssrgemm_tn_n_16x64x8_16x32x1_4x4_4x8_ using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = 
Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -529,9 +529,9 @@ static void BM_SM50_device_plus_multiplies_ssrgemm_tn_n_16x128x8_16x64x1_4x8_4x8 using WarpShape = cutlass::gemm::GemmShape<16, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -579,9 +579,9 @@ static void BM_SM50_device_plus_multiplies_ssrgemm_tn_n_32x32x8_32x16x1_4x4_8x4_ using WarpShape = cutlass::gemm::GemmShape<32, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -629,9 +629,9 @@ static void BM_SM50_device_plus_multiplies_ssrgemm_tn_n_32x64x8_32x32x1_8x4_4x8_ using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = 
Config::MultiplicationOp; @@ -679,9 +679,9 @@ static void BM_SM50_device_plus_multiplies_ssrgemm_tn_n_32x128x8_32x64x1_8x8_4x8 using WarpShape = cutlass::gemm::GemmShape<32, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -729,9 +729,9 @@ static void BM_SM50_device_plus_multiplies_ssrgemm_tn_n_64x64x8_64x32x1_8x8_8x4_ using WarpShape = cutlass::gemm::GemmShape<64, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -779,9 +779,9 @@ static void BM_SM50_device_plus_multiplies_ssrgemm_tn_n_32x32x8_16x32x1_4x4_4x8_ using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -829,9 +829,9 @@ static void 
BM_SM50_device_plus_multiplies_ssrgemm_tn_n_64x32x8_32x32x1_8x4_4x8_ using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -879,9 +879,9 @@ static void BM_SM50_device_plus_multiplies_ssrgemm_tn_n_64x64x8_32x64x1_8x8_4x8_ using WarpShape = cutlass::gemm::GemmShape<32, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -929,9 +929,9 @@ static void BM_SM50_device_plus_multiplies_ssrgemm_tn_n_128x32x8_64x32x1_8x8_8x4 using WarpShape = cutlass::gemm::GemmShape<64, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -979,9 +979,9 @@ static void 
BM_SM50_device_plus_multiplies_ssrgemm_tn_n_16x32x8_8x16x1_2x2_4x8_2 using WarpShape = cutlass::gemm::GemmShape<8, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1029,9 +1029,9 @@ static void BM_SM50_device_plus_multiplies_ssrgemm_tn_n_16x64x8_8x32x1_2x4_4x8_2 using WarpShape = cutlass::gemm::GemmShape<8, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1079,9 +1079,9 @@ static void BM_SM50_device_plus_multiplies_ssrgemm_tn_n_32x32x8_16x16x1_4x2_4x8_ using WarpShape = cutlass::gemm::GemmShape<16, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1129,9 +1129,9 @@ static void 
BM_SM50_device_plus_multiplies_ssrgemm_tn_n_32x64x8_16x32x1_4x4_4x8_ using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1179,9 +1179,9 @@ static void BM_SM50_device_plus_multiplies_ssrgemm_tn_n_32x128x8_16x64x1_4x8_4x8 using WarpShape = cutlass::gemm::GemmShape<16, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1229,9 +1229,9 @@ static void BM_SM50_device_plus_multiplies_ssrgemm_tn_n_64x32x8_32x16x1_4x4_8x4_ using WarpShape = cutlass::gemm::GemmShape<32, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1279,9 +1279,9 @@ static void 
BM_SM50_device_plus_multiplies_ssrgemm_tn_n_64x64x8_32x32x1_8x4_4x8_ using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1329,9 +1329,9 @@ static void BM_SM50_device_plus_multiplies_ssrgemm_tn_n_64x128x8_32x64x1_8x8_4x8 using WarpShape = cutlass::gemm::GemmShape<32, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1379,9 +1379,9 @@ static void BM_SM50_device_plus_multiplies_ssrgemm_tn_n_128x32x8_64x16x1_8x4_8x4 using WarpShape = cutlass::gemm::GemmShape<64, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1429,9 +1429,9 @@ static void 
BM_SM50_device_plus_multiplies_ssrgemm_tn_n_128x64x8_64x32x1_8x8_8x4 using WarpShape = cutlass::gemm::GemmShape<64, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1479,9 +1479,9 @@ static void BM_SM50_device_plus_multiplies_ssrgemm_tn_n_16x64x16_8x16x1_2x2_4x8_ using WarpShape = cutlass::gemm::GemmShape<8, 16, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1529,9 +1529,9 @@ static void BM_SM50_device_plus_multiplies_ssrgemm_tn_n_16x128x16_8x32x1_2x4_4x8 using WarpShape = cutlass::gemm::GemmShape<8, 32, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1579,9 +1579,9 @@ static void 
BM_SM50_device_plus_multiplies_ssrgemm_tn_n_32x32x8_16x8x1_2x2_8x4_2 using WarpShape = cutlass::gemm::GemmShape<16, 8, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1629,9 +1629,9 @@ static void BM_SM50_device_plus_multiplies_ssrgemm_tn_n_32x64x8_16x16x1_4x2_4x8_ using WarpShape = cutlass::gemm::GemmShape<16, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1679,9 +1679,9 @@ static void BM_SM50_device_plus_multiplies_ssrgemm_tn_n_32x128x8_16x32x1_4x4_4x8 using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1729,9 +1729,9 @@ static void 
BM_SM50_device_plus_multiplies_ssrgemm_tn_n_32x256x8_16x64x1_4x8_4x8 using WarpShape = cutlass::gemm::GemmShape<16, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1779,9 +1779,9 @@ static void BM_SM50_device_plus_multiplies_ssrgemm_tn_n_64x64x8_32x16x1_4x4_8x4_ using WarpShape = cutlass::gemm::GemmShape<32, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1829,9 +1829,9 @@ static void BM_SM50_device_plus_multiplies_ssrgemm_tn_n_64x128x8_32x32x1_8x4_4x8 using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1879,9 +1879,9 @@ static void 
BM_SM50_device_plus_multiplies_ssrgemm_tn_n_64x256x8_32x64x1_8x8_4x8 using WarpShape = cutlass::gemm::GemmShape<32, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1929,9 +1929,9 @@ static void BM_SM50_device_plus_multiplies_ssrgemm_tn_n_128x128x8_64x32x1_8x8_8x using WarpShape = cutlass::gemm::GemmShape<64, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1979,9 +1979,9 @@ static void BM_SM50_device_plus_multiplies_ssrgemm_tn_n_32x32x8_8x16x1_2x2_4x8_4 using WarpShape = cutlass::gemm::GemmShape<8, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -2029,9 +2029,9 @@ static void 
BM_SM50_device_plus_multiplies_ssrgemm_tn_n_64x32x8_16x16x1_4x2_4x8_ using WarpShape = cutlass::gemm::GemmShape<16, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -2079,9 +2079,9 @@ static void BM_SM50_device_plus_multiplies_ssrgemm_tn_n_64x64x8_16x32x1_4x4_4x8_ using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -2129,9 +2129,9 @@ static void BM_SM50_device_plus_multiplies_ssrgemm_tn_n_128x32x8_32x16x1_4x4_8x4 using WarpShape = cutlass::gemm::GemmShape<32, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -2179,9 +2179,9 @@ static void 
BM_SM50_device_plus_multiplies_ssrgemm_tn_n_128x64x8_32x32x1_8x4_4x8 using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -2229,9 +2229,9 @@ static void BM_SM50_device_plus_multiplies_ssrgemm_tn_n_128x128x8_32x64x1_8x8_4x using WarpShape = cutlass::gemm::GemmShape<32, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -2279,9 +2279,9 @@ static void BM_SM50_device_plus_multiplies_ssrgemm_tn_n_256x32x8_64x16x1_8x4_8x4 using WarpShape = cutlass::gemm::GemmShape<64, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -2329,9 +2329,9 @@ static void 
BM_SM50_device_plus_multiplies_ssrgemm_tn_n_256x64x8_64x32x1_8x8_8x4 using WarpShape = cutlass::gemm::GemmShape<64, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -2379,9 +2379,9 @@ static void BM_SM50_device_plus_multiplies_ssrgemm_tn_n_32x64x16_8x16x1_2x2_4x8_ using WarpShape = cutlass::gemm::GemmShape<8, 16, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -2429,9 +2429,9 @@ static void BM_SM50_device_plus_multiplies_ssrgemm_tn_n_32x128x16_8x32x1_2x4_4x8 using WarpShape = cutlass::gemm::GemmShape<8, 32, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -2479,9 +2479,9 @@ static void 
BM_SM50_device_plus_multiplies_ssrgemm_tn_n_64x32x16_16x8x1_2x2_8x4_ using WarpShape = cutlass::gemm::GemmShape<16, 8, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -2529,9 +2529,9 @@ static void BM_SM50_device_plus_multiplies_ssrgemm_tn_n_64x64x8_16x16x1_4x2_4x8_ using WarpShape = cutlass::gemm::GemmShape<16, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -2579,9 +2579,9 @@ static void BM_SM50_device_plus_multiplies_ssrgemm_tn_n_64x128x8_16x32x1_4x4_4x8 using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -2629,9 +2629,9 @@ static void 
BM_SM50_device_plus_multiplies_ssrgemm_tn_n_64x256x8_16x64x1_4x8_4x8 using WarpShape = cutlass::gemm::GemmShape<16, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -2679,9 +2679,9 @@ static void BM_SM50_device_plus_multiplies_ssrgemm_tn_n_128x32x16_32x8x1_4x2_8x4 using WarpShape = cutlass::gemm::GemmShape<32, 8, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -2729,9 +2729,9 @@ static void BM_SM50_device_plus_multiplies_ssrgemm_tn_n_128x64x8_32x16x1_4x4_8x4 using WarpShape = cutlass::gemm::GemmShape<32, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -2779,9 +2779,9 @@ static void 
BM_SM50_device_plus_multiplies_ssrgemm_tn_n_128x128x8_32x32x1_8x4_4x using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -2829,9 +2829,9 @@ static void BM_SM50_device_plus_multiplies_ssrgemm_tn_n_256x64x8_64x16x1_8x4_8x4 using WarpShape = cutlass::gemm::GemmShape<64, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; diff --git a/bench/device/sm50_simt_plus_multiplies_ssrgemm_tn_t.cu b/bench/device/sm50_simt_plus_multiplies_ssrgemm_tn_t.cu index 5c0fda3..de60c06 100644 --- a/bench/device/sm50_simt_plus_multiplies_ssrgemm_tn_t.cu +++ b/bench/device/sm50_simt_plus_multiplies_ssrgemm_tn_t.cu @@ -29,9 +29,9 @@ static void BM_SM50_device_plus_multiplies_ssrgemm_tn_t_8x32x8_8x32x1_2x4_4x8_1x using WarpShape = cutlass::gemm::GemmShape<8, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename 
cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -79,9 +79,9 @@ static void BM_SM50_device_plus_multiplies_ssrgemm_tn_t_16x32x8_16x32x1_4x4_4x8_ using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -129,9 +129,9 @@ static void BM_SM50_device_plus_multiplies_ssrgemm_tn_t_16x64x8_16x64x1_4x8_4x8_ using WarpShape = cutlass::gemm::GemmShape<16, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -179,9 +179,9 @@ static void BM_SM50_device_plus_multiplies_ssrgemm_tn_t_32x32x8_32x32x1_8x4_4x8_ using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + 
precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -229,9 +229,9 @@ static void BM_SM50_device_plus_multiplies_ssrgemm_tn_t_32x64x8_32x64x1_8x8_4x8_ using WarpShape = cutlass::gemm::GemmShape<32, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -279,9 +279,9 @@ static void BM_SM50_device_plus_multiplies_ssrgemm_tn_t_64x32x8_64x32x1_8x8_8x4_ using WarpShape = cutlass::gemm::GemmShape<64, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -329,9 +329,9 @@ static void BM_SM50_device_plus_multiplies_ssrgemm_tn_t_8x32x8_8x16x1_2x2_4x8_1x using WarpShape = cutlass::gemm::GemmShape<8, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, 
cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -379,9 +379,9 @@ static void BM_SM50_device_plus_multiplies_ssrgemm_tn_t_8x64x8_8x32x1_2x4_4x8_1x using WarpShape = cutlass::gemm::GemmShape<8, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -429,9 +429,9 @@ static void BM_SM50_device_plus_multiplies_ssrgemm_tn_t_16x32x8_16x16x1_4x2_4x8_ using WarpShape = cutlass::gemm::GemmShape<16, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -479,9 +479,9 @@ static void BM_SM50_device_plus_multiplies_ssrgemm_tn_t_16x64x8_16x32x1_4x4_4x8_ using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = 
Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -529,9 +529,9 @@ static void BM_SM50_device_plus_multiplies_ssrgemm_tn_t_16x128x8_16x64x1_4x8_4x8 using WarpShape = cutlass::gemm::GemmShape<16, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -579,9 +579,9 @@ static void BM_SM50_device_plus_multiplies_ssrgemm_tn_t_32x32x8_32x16x1_4x4_8x4_ using WarpShape = cutlass::gemm::GemmShape<32, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -629,9 +629,9 @@ static void BM_SM50_device_plus_multiplies_ssrgemm_tn_t_32x64x8_32x32x1_8x4_4x8_ using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = 
Config::MultiplicationOp; @@ -679,9 +679,9 @@ static void BM_SM50_device_plus_multiplies_ssrgemm_tn_t_32x128x8_32x64x1_8x8_4x8 using WarpShape = cutlass::gemm::GemmShape<32, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -729,9 +729,9 @@ static void BM_SM50_device_plus_multiplies_ssrgemm_tn_t_64x64x8_64x32x1_8x8_8x4_ using WarpShape = cutlass::gemm::GemmShape<64, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -779,9 +779,9 @@ static void BM_SM50_device_plus_multiplies_ssrgemm_tn_t_32x32x8_16x32x1_4x4_4x8_ using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -829,9 +829,9 @@ static void 
BM_SM50_device_plus_multiplies_ssrgemm_tn_t_64x32x8_32x32x1_8x4_4x8_ using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -879,9 +879,9 @@ static void BM_SM50_device_plus_multiplies_ssrgemm_tn_t_64x64x8_32x64x1_8x8_4x8_ using WarpShape = cutlass::gemm::GemmShape<32, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -929,9 +929,9 @@ static void BM_SM50_device_plus_multiplies_ssrgemm_tn_t_128x32x8_64x32x1_8x8_8x4 using WarpShape = cutlass::gemm::GemmShape<64, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -979,9 +979,9 @@ static void 
BM_SM50_device_plus_multiplies_ssrgemm_tn_t_16x32x8_8x16x1_2x2_4x8_2 using WarpShape = cutlass::gemm::GemmShape<8, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1029,9 +1029,9 @@ static void BM_SM50_device_plus_multiplies_ssrgemm_tn_t_16x64x8_8x32x1_2x4_4x8_2 using WarpShape = cutlass::gemm::GemmShape<8, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1079,9 +1079,9 @@ static void BM_SM50_device_plus_multiplies_ssrgemm_tn_t_32x32x8_16x16x1_4x2_4x8_ using WarpShape = cutlass::gemm::GemmShape<16, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1129,9 +1129,9 @@ static void 
BM_SM50_device_plus_multiplies_ssrgemm_tn_t_32x64x8_16x32x1_4x4_4x8_ using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1179,9 +1179,9 @@ static void BM_SM50_device_plus_multiplies_ssrgemm_tn_t_32x128x8_16x64x1_4x8_4x8 using WarpShape = cutlass::gemm::GemmShape<16, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1229,9 +1229,9 @@ static void BM_SM50_device_plus_multiplies_ssrgemm_tn_t_64x32x8_32x16x1_4x4_8x4_ using WarpShape = cutlass::gemm::GemmShape<32, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1279,9 +1279,9 @@ static void 
BM_SM50_device_plus_multiplies_ssrgemm_tn_t_64x64x8_32x32x1_8x4_4x8_ using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1329,9 +1329,9 @@ static void BM_SM50_device_plus_multiplies_ssrgemm_tn_t_64x128x8_32x64x1_8x8_4x8 using WarpShape = cutlass::gemm::GemmShape<32, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1379,9 +1379,9 @@ static void BM_SM50_device_plus_multiplies_ssrgemm_tn_t_128x32x8_64x16x1_8x4_8x4 using WarpShape = cutlass::gemm::GemmShape<64, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1429,9 +1429,9 @@ static void 
BM_SM50_device_plus_multiplies_ssrgemm_tn_t_128x64x8_64x32x1_8x8_8x4 using WarpShape = cutlass::gemm::GemmShape<64, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1479,9 +1479,9 @@ static void BM_SM50_device_plus_multiplies_ssrgemm_tn_t_16x64x16_8x16x1_2x2_4x8_ using WarpShape = cutlass::gemm::GemmShape<8, 16, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1529,9 +1529,9 @@ static void BM_SM50_device_plus_multiplies_ssrgemm_tn_t_16x128x16_8x32x1_2x4_4x8 using WarpShape = cutlass::gemm::GemmShape<8, 32, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1579,9 +1579,9 @@ static void 
BM_SM50_device_plus_multiplies_ssrgemm_tn_t_32x32x8_16x8x1_2x2_8x4_2 using WarpShape = cutlass::gemm::GemmShape<16, 8, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1629,9 +1629,9 @@ static void BM_SM50_device_plus_multiplies_ssrgemm_tn_t_32x64x8_16x16x1_4x2_4x8_ using WarpShape = cutlass::gemm::GemmShape<16, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1679,9 +1679,9 @@ static void BM_SM50_device_plus_multiplies_ssrgemm_tn_t_32x128x8_16x32x1_4x4_4x8 using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1729,9 +1729,9 @@ static void 
BM_SM50_device_plus_multiplies_ssrgemm_tn_t_32x256x8_16x64x1_4x8_4x8 using WarpShape = cutlass::gemm::GemmShape<16, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1779,9 +1779,9 @@ static void BM_SM50_device_plus_multiplies_ssrgemm_tn_t_64x64x8_32x16x1_4x4_8x4_ using WarpShape = cutlass::gemm::GemmShape<32, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1829,9 +1829,9 @@ static void BM_SM50_device_plus_multiplies_ssrgemm_tn_t_64x128x8_32x32x1_8x4_4x8 using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1879,9 +1879,9 @@ static void 
BM_SM50_device_plus_multiplies_ssrgemm_tn_t_64x256x8_32x64x1_8x8_4x8 using WarpShape = cutlass::gemm::GemmShape<32, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1929,9 +1929,9 @@ static void BM_SM50_device_plus_multiplies_ssrgemm_tn_t_128x128x8_64x32x1_8x8_8x using WarpShape = cutlass::gemm::GemmShape<64, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1979,9 +1979,9 @@ static void BM_SM50_device_plus_multiplies_ssrgemm_tn_t_32x32x8_8x16x1_2x2_4x8_4 using WarpShape = cutlass::gemm::GemmShape<8, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -2029,9 +2029,9 @@ static void 
BM_SM50_device_plus_multiplies_ssrgemm_tn_t_64x32x8_16x16x1_4x2_4x8_ using WarpShape = cutlass::gemm::GemmShape<16, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -2079,9 +2079,9 @@ static void BM_SM50_device_plus_multiplies_ssrgemm_tn_t_64x64x8_16x32x1_4x4_4x8_ using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -2129,9 +2129,9 @@ static void BM_SM50_device_plus_multiplies_ssrgemm_tn_t_128x32x8_32x16x1_4x4_8x4 using WarpShape = cutlass::gemm::GemmShape<32, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -2179,9 +2179,9 @@ static void 
BM_SM50_device_plus_multiplies_ssrgemm_tn_t_128x64x8_32x32x1_8x4_4x8 using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -2229,9 +2229,9 @@ static void BM_SM50_device_plus_multiplies_ssrgemm_tn_t_128x128x8_32x64x1_8x8_4x using WarpShape = cutlass::gemm::GemmShape<32, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -2279,9 +2279,9 @@ static void BM_SM50_device_plus_multiplies_ssrgemm_tn_t_256x32x8_64x16x1_8x4_8x4 using WarpShape = cutlass::gemm::GemmShape<64, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -2329,9 +2329,9 @@ static void 
BM_SM50_device_plus_multiplies_ssrgemm_tn_t_256x64x8_64x32x1_8x8_8x4 using WarpShape = cutlass::gemm::GemmShape<64, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -2379,9 +2379,9 @@ static void BM_SM50_device_plus_multiplies_ssrgemm_tn_t_32x64x16_8x16x1_2x2_4x8_ using WarpShape = cutlass::gemm::GemmShape<8, 16, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -2429,9 +2429,9 @@ static void BM_SM50_device_plus_multiplies_ssrgemm_tn_t_32x128x16_8x32x1_2x4_4x8 using WarpShape = cutlass::gemm::GemmShape<8, 32, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -2479,9 +2479,9 @@ static void 
BM_SM50_device_plus_multiplies_ssrgemm_tn_t_64x32x16_16x8x1_2x2_8x4_ using WarpShape = cutlass::gemm::GemmShape<16, 8, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -2529,9 +2529,9 @@ static void BM_SM50_device_plus_multiplies_ssrgemm_tn_t_64x64x8_16x16x1_4x2_4x8_ using WarpShape = cutlass::gemm::GemmShape<16, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -2579,9 +2579,9 @@ static void BM_SM50_device_plus_multiplies_ssrgemm_tn_t_64x128x8_16x32x1_4x4_4x8 using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -2629,9 +2629,9 @@ static void 
BM_SM50_device_plus_multiplies_ssrgemm_tn_t_64x256x8_16x64x1_4x8_4x8 using WarpShape = cutlass::gemm::GemmShape<16, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -2679,9 +2679,9 @@ static void BM_SM50_device_plus_multiplies_ssrgemm_tn_t_128x32x16_32x8x1_4x2_8x4 using WarpShape = cutlass::gemm::GemmShape<32, 8, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -2729,9 +2729,9 @@ static void BM_SM50_device_plus_multiplies_ssrgemm_tn_t_128x64x8_32x16x1_4x4_8x4 using WarpShape = cutlass::gemm::GemmShape<32, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -2779,9 +2779,9 @@ static void 
BM_SM50_device_plus_multiplies_ssrgemm_tn_t_128x128x8_32x32x1_8x4_4x using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -2829,9 +2829,9 @@ static void BM_SM50_device_plus_multiplies_ssrgemm_tn_t_256x64x8_64x16x1_8x4_8x4 using WarpShape = cutlass::gemm::GemmShape<64, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; diff --git a/bench/device/sm50_simt_plus_multiplies_ssrgemm_tt_n.cu b/bench/device/sm50_simt_plus_multiplies_ssrgemm_tt_n.cu index 07fa1aa..b2180da 100644 --- a/bench/device/sm50_simt_plus_multiplies_ssrgemm_tt_n.cu +++ b/bench/device/sm50_simt_plus_multiplies_ssrgemm_tt_n.cu @@ -29,9 +29,9 @@ static void BM_SM50_device_plus_multiplies_ssrgemm_tt_n_8x32x8_8x32x1_2x4_4x8_1x using WarpShape = cutlass::gemm::GemmShape<8, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename 
cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -79,9 +79,9 @@ static void BM_SM50_device_plus_multiplies_ssrgemm_tt_n_16x32x8_16x32x1_4x4_4x8_ using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -129,9 +129,9 @@ static void BM_SM50_device_plus_multiplies_ssrgemm_tt_n_16x64x8_16x64x1_4x8_4x8_ using WarpShape = cutlass::gemm::GemmShape<16, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -179,9 +179,9 @@ static void BM_SM50_device_plus_multiplies_ssrgemm_tt_n_32x32x8_32x32x1_8x4_4x8_ using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + 
precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -229,9 +229,9 @@ static void BM_SM50_device_plus_multiplies_ssrgemm_tt_n_32x64x8_32x64x1_8x8_4x8_ using WarpShape = cutlass::gemm::GemmShape<32, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -279,9 +279,9 @@ static void BM_SM50_device_plus_multiplies_ssrgemm_tt_n_64x32x8_64x32x1_8x8_8x4_ using WarpShape = cutlass::gemm::GemmShape<64, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -329,9 +329,9 @@ static void BM_SM50_device_plus_multiplies_ssrgemm_tt_n_8x32x8_8x16x1_2x2_4x8_1x using WarpShape = cutlass::gemm::GemmShape<8, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, 
cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -379,9 +379,9 @@ static void BM_SM50_device_plus_multiplies_ssrgemm_tt_n_8x64x8_8x32x1_2x4_4x8_1x using WarpShape = cutlass::gemm::GemmShape<8, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -429,9 +429,9 @@ static void BM_SM50_device_plus_multiplies_ssrgemm_tt_n_16x32x8_16x16x1_4x2_4x8_ using WarpShape = cutlass::gemm::GemmShape<16, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -479,9 +479,9 @@ static void BM_SM50_device_plus_multiplies_ssrgemm_tt_n_16x64x8_16x32x1_4x4_4x8_ using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = 
Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -529,9 +529,9 @@ static void BM_SM50_device_plus_multiplies_ssrgemm_tt_n_16x128x8_16x64x1_4x8_4x8 using WarpShape = cutlass::gemm::GemmShape<16, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -579,9 +579,9 @@ static void BM_SM50_device_plus_multiplies_ssrgemm_tt_n_32x32x8_32x16x1_4x4_8x4_ using WarpShape = cutlass::gemm::GemmShape<32, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -629,9 +629,9 @@ static void BM_SM50_device_plus_multiplies_ssrgemm_tt_n_32x64x8_32x32x1_8x4_4x8_ using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = 
Config::MultiplicationOp; @@ -679,9 +679,9 @@ static void BM_SM50_device_plus_multiplies_ssrgemm_tt_n_32x128x8_32x64x1_8x8_4x8 using WarpShape = cutlass::gemm::GemmShape<32, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -729,9 +729,9 @@ static void BM_SM50_device_plus_multiplies_ssrgemm_tt_n_64x64x8_64x32x1_8x8_8x4_ using WarpShape = cutlass::gemm::GemmShape<64, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -779,9 +779,9 @@ static void BM_SM50_device_plus_multiplies_ssrgemm_tt_n_32x32x8_16x32x1_4x4_4x8_ using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -829,9 +829,9 @@ static void 
BM_SM50_device_plus_multiplies_ssrgemm_tt_n_64x32x8_32x32x1_8x4_4x8_ using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -879,9 +879,9 @@ static void BM_SM50_device_plus_multiplies_ssrgemm_tt_n_64x64x8_32x64x1_8x8_4x8_ using WarpShape = cutlass::gemm::GemmShape<32, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -929,9 +929,9 @@ static void BM_SM50_device_plus_multiplies_ssrgemm_tt_n_128x32x8_64x32x1_8x8_8x4 using WarpShape = cutlass::gemm::GemmShape<64, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -979,9 +979,9 @@ static void 
BM_SM50_device_plus_multiplies_ssrgemm_tt_n_16x32x8_8x16x1_2x2_4x8_2 using WarpShape = cutlass::gemm::GemmShape<8, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1029,9 +1029,9 @@ static void BM_SM50_device_plus_multiplies_ssrgemm_tt_n_16x64x8_8x32x1_2x4_4x8_2 using WarpShape = cutlass::gemm::GemmShape<8, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1079,9 +1079,9 @@ static void BM_SM50_device_plus_multiplies_ssrgemm_tt_n_32x32x8_16x16x1_4x2_4x8_ using WarpShape = cutlass::gemm::GemmShape<16, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1129,9 +1129,9 @@ static void 
BM_SM50_device_plus_multiplies_ssrgemm_tt_n_32x64x8_16x32x1_4x4_4x8_ using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1179,9 +1179,9 @@ static void BM_SM50_device_plus_multiplies_ssrgemm_tt_n_32x128x8_16x64x1_4x8_4x8 using WarpShape = cutlass::gemm::GemmShape<16, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1229,9 +1229,9 @@ static void BM_SM50_device_plus_multiplies_ssrgemm_tt_n_64x32x8_32x16x1_4x4_8x4_ using WarpShape = cutlass::gemm::GemmShape<32, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1279,9 +1279,9 @@ static void 
BM_SM50_device_plus_multiplies_ssrgemm_tt_n_64x64x8_32x32x1_8x4_4x8_ using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1329,9 +1329,9 @@ static void BM_SM50_device_plus_multiplies_ssrgemm_tt_n_64x128x8_32x64x1_8x8_4x8 using WarpShape = cutlass::gemm::GemmShape<32, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1379,9 +1379,9 @@ static void BM_SM50_device_plus_multiplies_ssrgemm_tt_n_128x32x8_64x16x1_8x4_8x4 using WarpShape = cutlass::gemm::GemmShape<64, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1429,9 +1429,9 @@ static void 
BM_SM50_device_plus_multiplies_ssrgemm_tt_n_128x64x8_64x32x1_8x8_8x4 using WarpShape = cutlass::gemm::GemmShape<64, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1479,9 +1479,9 @@ static void BM_SM50_device_plus_multiplies_ssrgemm_tt_n_16x64x16_8x16x1_2x2_4x8_ using WarpShape = cutlass::gemm::GemmShape<8, 16, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1529,9 +1529,9 @@ static void BM_SM50_device_plus_multiplies_ssrgemm_tt_n_16x128x16_8x32x1_2x4_4x8 using WarpShape = cutlass::gemm::GemmShape<8, 32, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1579,9 +1579,9 @@ static void 
BM_SM50_device_plus_multiplies_ssrgemm_tt_n_32x32x8_16x8x1_2x2_8x4_2 using WarpShape = cutlass::gemm::GemmShape<16, 8, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1629,9 +1629,9 @@ static void BM_SM50_device_plus_multiplies_ssrgemm_tt_n_32x64x8_16x16x1_4x2_4x8_ using WarpShape = cutlass::gemm::GemmShape<16, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1679,9 +1679,9 @@ static void BM_SM50_device_plus_multiplies_ssrgemm_tt_n_32x128x8_16x32x1_4x4_4x8 using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1729,9 +1729,9 @@ static void 
BM_SM50_device_plus_multiplies_ssrgemm_tt_n_32x256x8_16x64x1_4x8_4x8 using WarpShape = cutlass::gemm::GemmShape<16, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1779,9 +1779,9 @@ static void BM_SM50_device_plus_multiplies_ssrgemm_tt_n_64x64x8_32x16x1_4x4_8x4_ using WarpShape = cutlass::gemm::GemmShape<32, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1829,9 +1829,9 @@ static void BM_SM50_device_plus_multiplies_ssrgemm_tt_n_64x128x8_32x32x1_8x4_4x8 using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1879,9 +1879,9 @@ static void 
BM_SM50_device_plus_multiplies_ssrgemm_tt_n_64x256x8_32x64x1_8x8_4x8 using WarpShape = cutlass::gemm::GemmShape<32, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1929,9 +1929,9 @@ static void BM_SM50_device_plus_multiplies_ssrgemm_tt_n_128x128x8_64x32x1_8x8_8x using WarpShape = cutlass::gemm::GemmShape<64, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1979,9 +1979,9 @@ static void BM_SM50_device_plus_multiplies_ssrgemm_tt_n_32x32x8_8x16x1_2x2_4x8_4 using WarpShape = cutlass::gemm::GemmShape<8, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -2029,9 +2029,9 @@ static void 
BM_SM50_device_plus_multiplies_ssrgemm_tt_n_64x32x8_16x16x1_4x2_4x8_ using WarpShape = cutlass::gemm::GemmShape<16, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -2079,9 +2079,9 @@ static void BM_SM50_device_plus_multiplies_ssrgemm_tt_n_64x64x8_16x32x1_4x4_4x8_ using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -2129,9 +2129,9 @@ static void BM_SM50_device_plus_multiplies_ssrgemm_tt_n_128x32x8_32x16x1_4x4_8x4 using WarpShape = cutlass::gemm::GemmShape<32, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -2179,9 +2179,9 @@ static void 
BM_SM50_device_plus_multiplies_ssrgemm_tt_n_128x64x8_32x32x1_8x4_4x8 using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -2229,9 +2229,9 @@ static void BM_SM50_device_plus_multiplies_ssrgemm_tt_n_128x128x8_32x64x1_8x8_4x using WarpShape = cutlass::gemm::GemmShape<32, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -2279,9 +2279,9 @@ static void BM_SM50_device_plus_multiplies_ssrgemm_tt_n_256x32x8_64x16x1_8x4_8x4 using WarpShape = cutlass::gemm::GemmShape<64, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -2329,9 +2329,9 @@ static void 
BM_SM50_device_plus_multiplies_ssrgemm_tt_n_256x64x8_64x32x1_8x8_8x4 using WarpShape = cutlass::gemm::GemmShape<64, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -2379,9 +2379,9 @@ static void BM_SM50_device_plus_multiplies_ssrgemm_tt_n_32x64x16_8x16x1_2x2_4x8_ using WarpShape = cutlass::gemm::GemmShape<8, 16, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -2429,9 +2429,9 @@ static void BM_SM50_device_plus_multiplies_ssrgemm_tt_n_32x128x16_8x32x1_2x4_4x8 using WarpShape = cutlass::gemm::GemmShape<8, 32, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -2479,9 +2479,9 @@ static void 
BM_SM50_device_plus_multiplies_ssrgemm_tt_n_64x32x16_16x8x1_2x2_8x4_ using WarpShape = cutlass::gemm::GemmShape<16, 8, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -2529,9 +2529,9 @@ static void BM_SM50_device_plus_multiplies_ssrgemm_tt_n_64x64x8_16x16x1_4x2_4x8_ using WarpShape = cutlass::gemm::GemmShape<16, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -2579,9 +2579,9 @@ static void BM_SM50_device_plus_multiplies_ssrgemm_tt_n_64x128x8_16x32x1_4x4_4x8 using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -2629,9 +2629,9 @@ static void 
BM_SM50_device_plus_multiplies_ssrgemm_tt_n_64x256x8_16x64x1_4x8_4x8 using WarpShape = cutlass::gemm::GemmShape<16, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -2679,9 +2679,9 @@ static void BM_SM50_device_plus_multiplies_ssrgemm_tt_n_128x32x16_32x8x1_4x2_8x4 using WarpShape = cutlass::gemm::GemmShape<32, 8, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -2729,9 +2729,9 @@ static void BM_SM50_device_plus_multiplies_ssrgemm_tt_n_128x64x8_32x16x1_4x4_8x4 using WarpShape = cutlass::gemm::GemmShape<32, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -2779,9 +2779,9 @@ static void 
BM_SM50_device_plus_multiplies_ssrgemm_tt_n_128x128x8_32x32x1_8x4_4x using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -2829,9 +2829,9 @@ static void BM_SM50_device_plus_multiplies_ssrgemm_tt_n_256x64x8_64x16x1_8x4_8x4 using WarpShape = cutlass::gemm::GemmShape<64, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; diff --git a/bench/device/sm50_simt_plus_multiplies_ssrgemm_tt_t.cu b/bench/device/sm50_simt_plus_multiplies_ssrgemm_tt_t.cu index 8631856..dcf3f5e 100644 --- a/bench/device/sm50_simt_plus_multiplies_ssrgemm_tt_t.cu +++ b/bench/device/sm50_simt_plus_multiplies_ssrgemm_tt_t.cu @@ -29,9 +29,9 @@ static void BM_SM50_device_plus_multiplies_ssrgemm_tt_t_8x32x8_8x32x1_2x4_4x8_1x using WarpShape = cutlass::gemm::GemmShape<8, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename 
cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -79,9 +79,9 @@ static void BM_SM50_device_plus_multiplies_ssrgemm_tt_t_16x32x8_16x32x1_4x4_4x8_ using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -129,9 +129,9 @@ static void BM_SM50_device_plus_multiplies_ssrgemm_tt_t_16x64x8_16x64x1_4x8_4x8_ using WarpShape = cutlass::gemm::GemmShape<16, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -179,9 +179,9 @@ static void BM_SM50_device_plus_multiplies_ssrgemm_tt_t_32x32x8_32x32x1_8x4_4x8_ using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + 
precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -229,9 +229,9 @@ static void BM_SM50_device_plus_multiplies_ssrgemm_tt_t_32x64x8_32x64x1_8x8_4x8_ using WarpShape = cutlass::gemm::GemmShape<32, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -279,9 +279,9 @@ static void BM_SM50_device_plus_multiplies_ssrgemm_tt_t_64x32x8_64x32x1_8x8_8x4_ using WarpShape = cutlass::gemm::GemmShape<64, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -329,9 +329,9 @@ static void BM_SM50_device_plus_multiplies_ssrgemm_tt_t_8x32x8_8x16x1_2x2_4x8_1x using WarpShape = cutlass::gemm::GemmShape<8, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, 
cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -379,9 +379,9 @@ static void BM_SM50_device_plus_multiplies_ssrgemm_tt_t_8x64x8_8x32x1_2x4_4x8_1x using WarpShape = cutlass::gemm::GemmShape<8, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -429,9 +429,9 @@ static void BM_SM50_device_plus_multiplies_ssrgemm_tt_t_16x32x8_16x16x1_4x2_4x8_ using WarpShape = cutlass::gemm::GemmShape<16, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -479,9 +479,9 @@ static void BM_SM50_device_plus_multiplies_ssrgemm_tt_t_16x64x8_16x32x1_4x4_4x8_ using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = 
Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -529,9 +529,9 @@ static void BM_SM50_device_plus_multiplies_ssrgemm_tt_t_16x128x8_16x64x1_4x8_4x8 using WarpShape = cutlass::gemm::GemmShape<16, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -579,9 +579,9 @@ static void BM_SM50_device_plus_multiplies_ssrgemm_tt_t_32x32x8_32x16x1_4x4_8x4_ using WarpShape = cutlass::gemm::GemmShape<32, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -629,9 +629,9 @@ static void BM_SM50_device_plus_multiplies_ssrgemm_tt_t_32x64x8_32x32x1_8x4_4x8_ using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = 
Config::MultiplicationOp; @@ -679,9 +679,9 @@ static void BM_SM50_device_plus_multiplies_ssrgemm_tt_t_32x128x8_32x64x1_8x8_4x8 using WarpShape = cutlass::gemm::GemmShape<32, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -729,9 +729,9 @@ static void BM_SM50_device_plus_multiplies_ssrgemm_tt_t_64x64x8_64x32x1_8x8_8x4_ using WarpShape = cutlass::gemm::GemmShape<64, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -779,9 +779,9 @@ static void BM_SM50_device_plus_multiplies_ssrgemm_tt_t_32x32x8_16x32x1_4x4_4x8_ using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -829,9 +829,9 @@ static void 
BM_SM50_device_plus_multiplies_ssrgemm_tt_t_64x32x8_32x32x1_8x4_4x8_ using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -879,9 +879,9 @@ static void BM_SM50_device_plus_multiplies_ssrgemm_tt_t_64x64x8_32x64x1_8x8_4x8_ using WarpShape = cutlass::gemm::GemmShape<32, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -929,9 +929,9 @@ static void BM_SM50_device_plus_multiplies_ssrgemm_tt_t_128x32x8_64x32x1_8x8_8x4 using WarpShape = cutlass::gemm::GemmShape<64, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -979,9 +979,9 @@ static void 
BM_SM50_device_plus_multiplies_ssrgemm_tt_t_16x32x8_8x16x1_2x2_4x8_2 using WarpShape = cutlass::gemm::GemmShape<8, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1029,9 +1029,9 @@ static void BM_SM50_device_plus_multiplies_ssrgemm_tt_t_16x64x8_8x32x1_2x4_4x8_2 using WarpShape = cutlass::gemm::GemmShape<8, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1079,9 +1079,9 @@ static void BM_SM50_device_plus_multiplies_ssrgemm_tt_t_32x32x8_16x16x1_4x2_4x8_ using WarpShape = cutlass::gemm::GemmShape<16, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1129,9 +1129,9 @@ static void 
BM_SM50_device_plus_multiplies_ssrgemm_tt_t_32x64x8_16x32x1_4x4_4x8_ using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1179,9 +1179,9 @@ static void BM_SM50_device_plus_multiplies_ssrgemm_tt_t_32x128x8_16x64x1_4x8_4x8 using WarpShape = cutlass::gemm::GemmShape<16, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1229,9 +1229,9 @@ static void BM_SM50_device_plus_multiplies_ssrgemm_tt_t_64x32x8_32x16x1_4x4_8x4_ using WarpShape = cutlass::gemm::GemmShape<32, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1279,9 +1279,9 @@ static void 
BM_SM50_device_plus_multiplies_ssrgemm_tt_t_64x64x8_32x32x1_8x4_4x8_ using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1329,9 +1329,9 @@ static void BM_SM50_device_plus_multiplies_ssrgemm_tt_t_64x128x8_32x64x1_8x8_4x8 using WarpShape = cutlass::gemm::GemmShape<32, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1379,9 +1379,9 @@ static void BM_SM50_device_plus_multiplies_ssrgemm_tt_t_128x32x8_64x16x1_8x4_8x4 using WarpShape = cutlass::gemm::GemmShape<64, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1429,9 +1429,9 @@ static void 
BM_SM50_device_plus_multiplies_ssrgemm_tt_t_128x64x8_64x32x1_8x8_8x4 using WarpShape = cutlass::gemm::GemmShape<64, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1479,9 +1479,9 @@ static void BM_SM50_device_plus_multiplies_ssrgemm_tt_t_16x64x16_8x16x1_2x2_4x8_ using WarpShape = cutlass::gemm::GemmShape<8, 16, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1529,9 +1529,9 @@ static void BM_SM50_device_plus_multiplies_ssrgemm_tt_t_16x128x16_8x32x1_2x4_4x8 using WarpShape = cutlass::gemm::GemmShape<8, 32, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1579,9 +1579,9 @@ static void 
BM_SM50_device_plus_multiplies_ssrgemm_tt_t_32x32x8_16x8x1_2x2_8x4_2 using WarpShape = cutlass::gemm::GemmShape<16, 8, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1629,9 +1629,9 @@ static void BM_SM50_device_plus_multiplies_ssrgemm_tt_t_32x64x8_16x16x1_4x2_4x8_ using WarpShape = cutlass::gemm::GemmShape<16, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1679,9 +1679,9 @@ static void BM_SM50_device_plus_multiplies_ssrgemm_tt_t_32x128x8_16x32x1_4x4_4x8 using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1729,9 +1729,9 @@ static void 
BM_SM50_device_plus_multiplies_ssrgemm_tt_t_32x256x8_16x64x1_4x8_4x8 using WarpShape = cutlass::gemm::GemmShape<16, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1779,9 +1779,9 @@ static void BM_SM50_device_plus_multiplies_ssrgemm_tt_t_64x64x8_32x16x1_4x4_8x4_ using WarpShape = cutlass::gemm::GemmShape<32, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1829,9 +1829,9 @@ static void BM_SM50_device_plus_multiplies_ssrgemm_tt_t_64x128x8_32x32x1_8x4_4x8 using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1879,9 +1879,9 @@ static void 
BM_SM50_device_plus_multiplies_ssrgemm_tt_t_64x256x8_32x64x1_8x8_4x8 using WarpShape = cutlass::gemm::GemmShape<32, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1929,9 +1929,9 @@ static void BM_SM50_device_plus_multiplies_ssrgemm_tt_t_128x128x8_64x32x1_8x8_8x using WarpShape = cutlass::gemm::GemmShape<64, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1979,9 +1979,9 @@ static void BM_SM50_device_plus_multiplies_ssrgemm_tt_t_32x32x8_8x16x1_2x2_4x8_4 using WarpShape = cutlass::gemm::GemmShape<8, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -2029,9 +2029,9 @@ static void 
BM_SM50_device_plus_multiplies_ssrgemm_tt_t_64x32x8_16x16x1_4x2_4x8_ using WarpShape = cutlass::gemm::GemmShape<16, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -2079,9 +2079,9 @@ static void BM_SM50_device_plus_multiplies_ssrgemm_tt_t_64x64x8_16x32x1_4x4_4x8_ using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -2129,9 +2129,9 @@ static void BM_SM50_device_plus_multiplies_ssrgemm_tt_t_128x32x8_32x16x1_4x4_8x4 using WarpShape = cutlass::gemm::GemmShape<32, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -2179,9 +2179,9 @@ static void 
BM_SM50_device_plus_multiplies_ssrgemm_tt_t_128x64x8_32x32x1_8x4_4x8 using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -2229,9 +2229,9 @@ static void BM_SM50_device_plus_multiplies_ssrgemm_tt_t_128x128x8_32x64x1_8x8_4x using WarpShape = cutlass::gemm::GemmShape<32, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -2279,9 +2279,9 @@ static void BM_SM50_device_plus_multiplies_ssrgemm_tt_t_256x32x8_64x16x1_8x4_8x4 using WarpShape = cutlass::gemm::GemmShape<64, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -2329,9 +2329,9 @@ static void 
BM_SM50_device_plus_multiplies_ssrgemm_tt_t_256x64x8_64x32x1_8x8_8x4 using WarpShape = cutlass::gemm::GemmShape<64, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -2379,9 +2379,9 @@ static void BM_SM50_device_plus_multiplies_ssrgemm_tt_t_32x64x16_8x16x1_2x2_4x8_ using WarpShape = cutlass::gemm::GemmShape<8, 16, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -2429,9 +2429,9 @@ static void BM_SM50_device_plus_multiplies_ssrgemm_tt_t_32x128x16_8x32x1_2x4_4x8 using WarpShape = cutlass::gemm::GemmShape<8, 32, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -2479,9 +2479,9 @@ static void 
BM_SM50_device_plus_multiplies_ssrgemm_tt_t_64x32x16_16x8x1_2x2_8x4_ using WarpShape = cutlass::gemm::GemmShape<16, 8, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -2529,9 +2529,9 @@ static void BM_SM50_device_plus_multiplies_ssrgemm_tt_t_64x64x8_16x16x1_4x2_4x8_ using WarpShape = cutlass::gemm::GemmShape<16, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -2579,9 +2579,9 @@ static void BM_SM50_device_plus_multiplies_ssrgemm_tt_t_64x128x8_16x32x1_4x4_4x8 using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -2629,9 +2629,9 @@ static void 
BM_SM50_device_plus_multiplies_ssrgemm_tt_t_64x256x8_16x64x1_4x8_4x8 using WarpShape = cutlass::gemm::GemmShape<16, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -2679,9 +2679,9 @@ static void BM_SM50_device_plus_multiplies_ssrgemm_tt_t_128x32x16_32x8x1_4x2_8x4 using WarpShape = cutlass::gemm::GemmShape<32, 8, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -2729,9 +2729,9 @@ static void BM_SM50_device_plus_multiplies_ssrgemm_tt_t_128x64x8_32x16x1_4x4_8x4 using WarpShape = cutlass::gemm::GemmShape<32, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -2779,9 +2779,9 @@ static void 
BM_SM50_device_plus_multiplies_ssrgemm_tt_t_128x128x8_32x32x1_8x4_4x using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -2829,9 +2829,9 @@ static void BM_SM50_device_plus_multiplies_ssrgemm_tt_t_256x64x8_64x16x1_8x4_8x4 using WarpShape = cutlass::gemm::GemmShape<64, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; diff --git a/include/cuasr/gemm/device/default_srgemm_configuration.h b/include/cuasr/gemm/device/default_srgemm_configuration.h index 3c9bdc8..9237353 100644 --- a/include/cuasr/gemm/device/default_srgemm_configuration.h +++ b/include/cuasr/gemm/device/default_srgemm_configuration.h @@ -30,13 +30,15 @@ template < typename ElementB, typename ElementC, typename ElementAccumulator, - typename OperatorClass, typename AdditionOp, typename MultiplicationOp, + typename OperatorClass, typename ArchTag > struct DefaultSemiRingConfiguration; +//////////////////////////////////////////////////////////////////////////////// +/////////////////////////////////// SM 50 ////////////////////////////////////// 
//////////////////////////////////////////////////////////////////////////////// // Plus-Times semi-ring GEMM configuration @@ -50,9 +52,9 @@ struct DefaultSemiRingConfiguration< Element, Element, Element, - cutlass::arch::OpClassSimt, cuasr::plus, cuasr::multiplies, + cutlass::arch::OpClassSimt, ArchTag> { static int constexpr kAlignmentA = 1; @@ -80,9 +82,9 @@ struct DefaultSemiRingConfiguration< Element, Element, Element, - cutlass::arch::OpClassSimt, cuasr::minimum, cuasr::plus, + cutlass::arch::OpClassSimt, ArchTag> { static int constexpr kAlignmentA = 1; @@ -110,9 +112,9 @@ struct DefaultSemiRingConfiguration< Element, Element, Element, - cutlass::arch::OpClassSimt, cuasr::maximum, cuasr::plus, + cutlass::arch::OpClassSimt, ArchTag> { static int constexpr kAlignmentA = 1; @@ -139,9 +141,9 @@ struct DefaultSemiRingConfiguration< Element, Element, Element, - cutlass::arch::OpClassSimt, cuasr::maximum, cuasr::minimum, + cutlass::arch::OpClassSimt, ArchTag> { static int constexpr kAlignmentA = 1; @@ -168,9 +170,9 @@ struct DefaultSemiRingConfiguration< Element, Element, Element, - cutlass::arch::OpClassSimt, cuasr::minimum, cuasr::maximum, + cutlass::arch::OpClassSimt, ArchTag> { static int constexpr kAlignmentA = 1; @@ -197,9 +199,9 @@ struct DefaultSemiRingConfiguration< Element, Element, Element, - cutlass::arch::OpClassSimt, cuasr::minimum, cuasr::multiplies, + cutlass::arch::OpClassSimt, ArchTag> { static int constexpr kAlignmentA = 1; @@ -226,9 +228,9 @@ struct DefaultSemiRingConfiguration< Element, Element, Element, - cutlass::arch::OpClassSimt, cuasr::maximum, cuasr::multiplies, + cutlass::arch::OpClassSimt, ArchTag> { static int constexpr kAlignmentA = 1; @@ -255,9 +257,9 @@ struct DefaultSemiRingConfiguration< Element, Element, Element, - cutlass::arch::OpClassSimt, cuasr::binary_or, cuasr::binary_and, + cutlass::arch::OpClassSimt, ArchTag> { static int constexpr kAlignmentA = 1; @@ -275,6 +277,9 @@ struct DefaultSemiRingConfiguration< }; 
//////////////////////////////////////////////////////////////////////////////// +/////////////////////////////////// SM 80 ////////////////////////////////////// +//////////////////////////////////////////////////////////////////////////////// + } // namespace device } // namespace gemm diff --git a/include/cuasr/gemm/device/srgemm.h b/include/cuasr/gemm/device/srgemm.h index 50482ff..6b23b1b 100644 --- a/include/cuasr/gemm/device/srgemm.h +++ b/include/cuasr/gemm/device/srgemm.h @@ -51,34 +51,34 @@ template < /// Threadblock-level tile size (concept: GemmShape) typename ThreadblockShape_ = typename DefaultSemiRingConfiguration< ElementA_, ElementB_, ElementC_, ElementAccumulator_, - OperatorClass_, AdditionOp_, MultiplicationOp_, ArchTag_>::ThreadblockShape, + AdditionOp_, MultiplicationOp_, OperatorClass_, ArchTag_>::ThreadblockShape, /// Warp-level tile size (concept: GemmShape) typename WarpShape_ = typename DefaultSemiRingConfiguration< ElementA_, ElementB_, ElementC_, ElementAccumulator_, - OperatorClass_, AdditionOp_, MultiplicationOp_, ArchTag_>::WarpShape, + AdditionOp_, MultiplicationOp_, OperatorClass_, ArchTag_>::WarpShape, /// Instruction-level tile size (concept: GemmShape) typename InstructionShape_ = typename DefaultSemiRingConfiguration< ElementA_, ElementB_, ElementC_, ElementAccumulator_, - OperatorClass_, AdditionOp_, MultiplicationOp_, ArchTag_>::InstructionShape, + AdditionOp_, MultiplicationOp_, OperatorClass_, ArchTag_>::InstructionShape, /// Epilogue output operator typename EpilogueOutputOp_ = typename DefaultSemiRingConfiguration< ElementA_, ElementB_, ElementC_, ElementAccumulator_, - OperatorClass_, AdditionOp_, MultiplicationOp_, ArchTag_>::EpilogueOutputOp, + AdditionOp_, MultiplicationOp_, OperatorClass_, ArchTag_>::EpilogueOutputOp, /// Threadblock-level swizzling operator typename ThreadblockSwizzle_ = typename cutlass::gemm::threadblock::GemmIdentityThreadblockSwizzle<>, /// Number of stages used in the pipelined mainloop int 
Stages = DefaultSemiRingConfiguration< ElementA_, ElementB_, ElementC_, ElementAccumulator_, - OperatorClass_, AdditionOp_, MultiplicationOp_, ArchTag_>::kStages, + AdditionOp_, MultiplicationOp_, OperatorClass_, ArchTag_>::kStages, /// Access granularity of A matrix in units of elements int AlignmentA = DefaultSemiRingConfiguration< ElementA_, ElementB_, ElementC_, ElementAccumulator_, - OperatorClass_, AdditionOp_, MultiplicationOp_, ArchTag_>::kAlignmentA, + AdditionOp_, MultiplicationOp_, OperatorClass_, ArchTag_>::kAlignmentA, /// Access granularity of B matrix in units of elements int AlignmentB = DefaultSemiRingConfiguration< ElementA_, ElementB_, ElementC_, ElementAccumulator_, - OperatorClass_, AdditionOp_, MultiplicationOp_, ArchTag_>::kAlignmentB, + AdditionOp_, MultiplicationOp_, OperatorClass_, ArchTag_>::kAlignmentB, /// If true, kernel supports split-K with serial reduction bool SplitKSerial = false > diff --git a/include/cuasr/gemm/device/srgemm_splitk_parallel.h b/include/cuasr/gemm/device/srgemm_splitk_parallel.h index b88a522..dcfc0b9 100644 --- a/include/cuasr/gemm/device/srgemm_splitk_parallel.h +++ b/include/cuasr/gemm/device/srgemm_splitk_parallel.h @@ -59,24 +59,24 @@ template < /// Threadblock-level tile size (concept: GemmShape) typename ThreadblockShape_ = typename DefaultSemiRingConfiguration< ElementA_, ElementB_, ElementC_, ElementAccumulator_, - OperatorClass_, AdditionOp_, MultiplicationOp_, ArchTag_>::ThreadblockShape, + AdditionOp_, MultiplicationOp_, OperatorClass_, ArchTag_>::ThreadblockShape, /// Warp-level tile size (concept: GemmShape) typename WarpShape_ = typename DefaultSemiRingConfiguration< ElementA_, ElementB_, ElementC_, ElementAccumulator_, - OperatorClass_, AdditionOp_, MultiplicationOp_, ArchTag_>::WarpShape, + AdditionOp_, MultiplicationOp_, OperatorClass_, ArchTag_>::WarpShape, /// Instruction-level tile size (concept: GemmShape) typename InstructionShape_ = typename DefaultSemiRingConfiguration< ElementA_, 
ElementB_, ElementC_, ElementAccumulator_, - OperatorClass_, AdditionOp_, MultiplicationOp_, ArchTag_>::InstructionShape, + AdditionOp_, MultiplicationOp_, OperatorClass_, ArchTag_>::InstructionShape, /// Epilogue output operator typename EpilogueOutputOp_ = typename DefaultSemiRingConfiguration< ElementA_, ElementB_, ElementC_, ElementAccumulator_, - OperatorClass_, AdditionOp_, MultiplicationOp_, ArchTag_>::EpilogueOutputOp, + AdditionOp_, MultiplicationOp_, OperatorClass_, ArchTag_>::EpilogueOutputOp, /// Epilogue conversion operator typename ConvertScaledOp_ = cutlass::epilogue::thread::Convert< ElementAccumulator_, DefaultSemiRingConfiguration< ElementA_, ElementB_, ElementC_, ElementAccumulator_, - OperatorClass_, AdditionOp_, MultiplicationOp_, ArchTag_>::EpilogueOutputOp::kCount, + AdditionOp_, MultiplicationOp_, OperatorClass_, ArchTag_>::EpilogueOutputOp::kCount, ElementAccumulator_>, /// Reduction operator typename ReductionOp_ = cuasr::reduction::thread::SemiringReduce< @@ -88,15 +88,15 @@ template < /// Number of stages used in the pipelined mainloop int Stages = DefaultSemiRingConfiguration< ElementA_, ElementB_, ElementC_, ElementAccumulator_, - OperatorClass_, AdditionOp_, MultiplicationOp_, ArchTag_>::kStages, + AdditionOp_, MultiplicationOp_, OperatorClass_, ArchTag_>::kStages, /// Access granularity of A matrix in units of elements int kAlignmentA = DefaultSemiRingConfiguration< ElementA_, ElementB_, ElementC_, ElementAccumulator_, - OperatorClass_, AdditionOp_, MultiplicationOp_, ArchTag_>::kAlignmentA, + AdditionOp_, MultiplicationOp_, OperatorClass_, ArchTag_>::kAlignmentA, /// Access granularity of B matrix in units of elements int kAlignmentB = DefaultSemiRingConfiguration< ElementA_, ElementB_, ElementC_, ElementAccumulator_, - OperatorClass_, AdditionOp_, MultiplicationOp_, ArchTag_>::kAlignmentB + AdditionOp_, MultiplicationOp_, OperatorClass_, ArchTag_>::kAlignmentB > class SrgemmSplitKParallel { public: diff --git 
a/test/device/gen_simt.py b/test/device/gen_simt.py index 52678f0..7cda853 100644 --- a/test/device/gen_simt.py +++ b/test/device/gen_simt.py @@ -103,9 +103,9 @@ using WarpShape = cutlass::gemm::GemmShape<{13}, {14}, {12}>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::{0}, cuasr::{1}, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::{0}, cuasr::{1}, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; diff --git a/test/device/sm50_simt_binary_or_binary_and_dsrgemm_nn_n.cu b/test/device/sm50_simt_binary_or_binary_and_dsrgemm_nn_n.cu index 6e0e06d..1ab2c24 100644 --- a/test/device/sm50_simt_binary_or_binary_and_dsrgemm_nn_n.cu +++ b/test/device/sm50_simt_binary_or_binary_and_dsrgemm_nn_n.cu @@ -38,9 +38,9 @@ TEST(SM50_device_binary_or_binary_and_dsrgemm_nn_n, 8x32x8_8x32x1_2x4_4x8_1x1) { using WarpShape = cutlass::gemm::GemmShape<8, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -74,9 +74,9 @@ TEST(SM50_device_binary_or_binary_and_dsrgemm_nn_n, 16x32x8_16x32x1_4x4_4x8_1x1) using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - 
cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -110,9 +110,9 @@ TEST(SM50_device_binary_or_binary_and_dsrgemm_nn_n, 16x64x8_16x64x1_4x8_4x8_1x1) using WarpShape = cutlass::gemm::GemmShape<16, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -146,9 +146,9 @@ TEST(SM50_device_binary_or_binary_and_dsrgemm_nn_n, 32x32x8_32x32x1_8x4_4x8_1x1) using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -182,9 +182,9 @@ TEST(SM50_device_binary_or_binary_and_dsrgemm_nn_n, 8x32x8_8x16x1_2x2_4x8_1x2) { using WarpShape = cutlass::gemm::GemmShape<8, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, 
cuasr::binary_and, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -218,9 +218,9 @@ TEST(SM50_device_binary_or_binary_and_dsrgemm_nn_n, 8x64x8_8x32x1_2x4_4x8_1x2) { using WarpShape = cutlass::gemm::GemmShape<8, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -254,9 +254,9 @@ TEST(SM50_device_binary_or_binary_and_dsrgemm_nn_n, 16x32x8_16x16x1_4x2_4x8_1x2) using WarpShape = cutlass::gemm::GemmShape<16, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -290,9 +290,9 @@ TEST(SM50_device_binary_or_binary_and_dsrgemm_nn_n, 16x64x8_16x32x1_4x4_4x8_1x2) using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + 
using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -326,9 +326,9 @@ TEST(SM50_device_binary_or_binary_and_dsrgemm_nn_n, 16x128x8_16x64x1_4x8_4x8_1x2 using WarpShape = cutlass::gemm::GemmShape<16, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -362,9 +362,9 @@ TEST(SM50_device_binary_or_binary_and_dsrgemm_nn_n, 32x32x8_32x16x1_4x4_8x4_1x2) using WarpShape = cutlass::gemm::GemmShape<32, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -398,9 +398,9 @@ TEST(SM50_device_binary_or_binary_and_dsrgemm_nn_n, 32x64x8_32x32x1_8x4_4x8_1x2) using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename 
cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -434,9 +434,9 @@ TEST(SM50_device_binary_or_binary_and_dsrgemm_nn_n, 32x32x8_16x32x1_4x4_4x8_2x1) using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -470,9 +470,9 @@ TEST(SM50_device_binary_or_binary_and_dsrgemm_nn_n, 64x32x8_32x32x1_8x4_4x8_2x1) using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -506,9 +506,9 @@ TEST(SM50_device_binary_or_binary_and_dsrgemm_nn_n, 16x32x8_8x16x1_2x2_4x8_2x2) using WarpShape = cutlass::gemm::GemmShape<8, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename 
cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -542,9 +542,9 @@ TEST(SM50_device_binary_or_binary_and_dsrgemm_nn_n, 16x64x8_8x32x1_2x4_4x8_2x2) using WarpShape = cutlass::gemm::GemmShape<8, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -578,9 +578,9 @@ TEST(SM50_device_binary_or_binary_and_dsrgemm_nn_n, 32x32x8_16x16x1_4x2_4x8_2x2) using WarpShape = cutlass::gemm::GemmShape<16, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -614,9 +614,9 @@ TEST(SM50_device_binary_or_binary_and_dsrgemm_nn_n, 32x64x8_16x32x1_4x4_4x8_2x2) using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename 
cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -650,9 +650,9 @@ TEST(SM50_device_binary_or_binary_and_dsrgemm_nn_n, 32x128x8_16x64x1_4x8_4x8_2x2 using WarpShape = cutlass::gemm::GemmShape<16, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -686,9 +686,9 @@ TEST(SM50_device_binary_or_binary_and_dsrgemm_nn_n, 64x32x8_32x16x1_4x4_8x4_2x2) using WarpShape = cutlass::gemm::GemmShape<32, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -722,9 +722,9 @@ TEST(SM50_device_binary_or_binary_and_dsrgemm_nn_n, 64x64x8_32x32x1_8x4_4x8_2x2) using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename 
cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -758,9 +758,9 @@ TEST(SM50_device_binary_or_binary_and_dsrgemm_nn_n, 128x32x8_64x16x1_8x4_8x4_2x2 using WarpShape = cutlass::gemm::GemmShape<64, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -794,9 +794,9 @@ TEST(SM50_device_binary_or_binary_and_dsrgemm_nn_n, 16x64x16_8x16x1_2x2_4x8_2x4) using WarpShape = cutlass::gemm::GemmShape<8, 16, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -830,9 +830,9 @@ TEST(SM50_device_binary_or_binary_and_dsrgemm_nn_n, 16x128x16_8x32x1_2x4_4x8_2x4 using WarpShape = cutlass::gemm::GemmShape<8, 32, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename 
cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -866,9 +866,9 @@ TEST(SM50_device_binary_or_binary_and_dsrgemm_nn_n, 32x32x8_16x8x1_2x2_8x4_2x4) using WarpShape = cutlass::gemm::GemmShape<16, 8, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -902,9 +902,9 @@ TEST(SM50_device_binary_or_binary_and_dsrgemm_nn_n, 32x64x8_16x16x1_4x2_4x8_2x4) using WarpShape = cutlass::gemm::GemmShape<16, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -938,9 +938,9 @@ TEST(SM50_device_binary_or_binary_and_dsrgemm_nn_n, 32x128x8_16x32x1_4x4_4x8_2x4 using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename 
cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -974,9 +974,9 @@ TEST(SM50_device_binary_or_binary_and_dsrgemm_nn_n, 64x64x8_32x16x1_4x4_8x4_2x4) using WarpShape = cutlass::gemm::GemmShape<32, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1010,9 +1010,9 @@ TEST(SM50_device_binary_or_binary_and_dsrgemm_nn_n, 32x32x8_8x16x1_2x2_4x8_4x2) using WarpShape = cutlass::gemm::GemmShape<8, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1046,9 +1046,9 @@ TEST(SM50_device_binary_or_binary_and_dsrgemm_nn_n, 64x32x8_16x16x1_4x2_4x8_4x2) using WarpShape = cutlass::gemm::GemmShape<16, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename 
cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1082,9 +1082,9 @@ TEST(SM50_device_binary_or_binary_and_dsrgemm_nn_n, 64x64x8_16x32x1_4x4_4x8_4x2) using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1118,9 +1118,9 @@ TEST(SM50_device_binary_or_binary_and_dsrgemm_nn_n, 128x32x8_32x16x1_4x4_8x4_4x2 using WarpShape = cutlass::gemm::GemmShape<32, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1154,9 +1154,9 @@ TEST(SM50_device_binary_or_binary_and_dsrgemm_nn_n, 32x64x16_8x16x1_2x2_4x8_4x4) using WarpShape = cutlass::gemm::GemmShape<8, 16, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename 
cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1190,9 +1190,9 @@ TEST(SM50_device_binary_or_binary_and_dsrgemm_nn_n, 32x128x16_8x32x1_2x4_4x8_4x4 using WarpShape = cutlass::gemm::GemmShape<8, 32, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1226,9 +1226,9 @@ TEST(SM50_device_binary_or_binary_and_dsrgemm_nn_n, 64x32x16_16x8x1_2x2_8x4_4x4) using WarpShape = cutlass::gemm::GemmShape<16, 8, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1262,9 +1262,9 @@ TEST(SM50_device_binary_or_binary_and_dsrgemm_nn_n, 64x64x8_16x16x1_4x2_4x8_4x4) using WarpShape = cutlass::gemm::GemmShape<16, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename 
cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1298,9 +1298,9 @@ TEST(SM50_device_binary_or_binary_and_dsrgemm_nn_n, 128x32x16_32x8x1_4x2_8x4_4x4 using WarpShape = cutlass::gemm::GemmShape<32, 8, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; diff --git a/test/device/sm50_simt_binary_or_binary_and_dsrgemm_nn_t.cu b/test/device/sm50_simt_binary_or_binary_and_dsrgemm_nn_t.cu index 48e3855..c74b6fa 100644 --- a/test/device/sm50_simt_binary_or_binary_and_dsrgemm_nn_t.cu +++ b/test/device/sm50_simt_binary_or_binary_and_dsrgemm_nn_t.cu @@ -38,9 +38,9 @@ TEST(SM50_device_binary_or_binary_and_dsrgemm_nn_t, 8x32x8_8x32x1_2x4_4x8_1x1) { using WarpShape = cutlass::gemm::GemmShape<8, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -74,9 +74,9 @@ TEST(SM50_device_binary_or_binary_and_dsrgemm_nn_t, 16x32x8_16x32x1_4x4_4x8_1x1) using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using 
InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -110,9 +110,9 @@ TEST(SM50_device_binary_or_binary_and_dsrgemm_nn_t, 16x64x8_16x64x1_4x8_4x8_1x1) using WarpShape = cutlass::gemm::GemmShape<16, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -146,9 +146,9 @@ TEST(SM50_device_binary_or_binary_and_dsrgemm_nn_t, 32x32x8_32x32x1_8x4_4x8_1x1) using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -182,9 +182,9 @@ TEST(SM50_device_binary_or_binary_and_dsrgemm_nn_t, 8x32x8_8x16x1_2x2_4x8_1x2) { using WarpShape = cutlass::gemm::GemmShape<8, 16, 8>; using InstructionShape = 
cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -218,9 +218,9 @@ TEST(SM50_device_binary_or_binary_and_dsrgemm_nn_t, 8x64x8_8x32x1_2x4_4x8_1x2) { using WarpShape = cutlass::gemm::GemmShape<8, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -254,9 +254,9 @@ TEST(SM50_device_binary_or_binary_and_dsrgemm_nn_t, 16x32x8_16x16x1_4x2_4x8_1x2) using WarpShape = cutlass::gemm::GemmShape<16, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -290,9 +290,9 @@ TEST(SM50_device_binary_or_binary_and_dsrgemm_nn_t, 16x64x8_16x32x1_4x4_4x8_1x2) using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 
1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -326,9 +326,9 @@ TEST(SM50_device_binary_or_binary_and_dsrgemm_nn_t, 16x128x8_16x64x1_4x8_4x8_1x2 using WarpShape = cutlass::gemm::GemmShape<16, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -362,9 +362,9 @@ TEST(SM50_device_binary_or_binary_and_dsrgemm_nn_t, 32x32x8_32x16x1_4x4_8x4_1x2) using WarpShape = cutlass::gemm::GemmShape<32, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -398,9 +398,9 @@ TEST(SM50_device_binary_or_binary_and_dsrgemm_nn_t, 32x64x8_32x32x1_8x4_4x8_1x2) using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = 
typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -434,9 +434,9 @@ TEST(SM50_device_binary_or_binary_and_dsrgemm_nn_t, 32x32x8_16x32x1_4x4_4x8_2x1) using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -470,9 +470,9 @@ TEST(SM50_device_binary_or_binary_and_dsrgemm_nn_t, 64x32x8_32x32x1_8x4_4x8_2x1) using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -506,9 +506,9 @@ TEST(SM50_device_binary_or_binary_and_dsrgemm_nn_t, 16x32x8_8x16x1_2x2_4x8_2x2) using WarpShape = cutlass::gemm::GemmShape<8, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename 
cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -542,9 +542,9 @@ TEST(SM50_device_binary_or_binary_and_dsrgemm_nn_t, 16x64x8_8x32x1_2x4_4x8_2x2) using WarpShape = cutlass::gemm::GemmShape<8, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -578,9 +578,9 @@ TEST(SM50_device_binary_or_binary_and_dsrgemm_nn_t, 32x32x8_16x16x1_4x2_4x8_2x2) using WarpShape = cutlass::gemm::GemmShape<16, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -614,9 +614,9 @@ TEST(SM50_device_binary_or_binary_and_dsrgemm_nn_t, 32x64x8_16x32x1_4x4_4x8_2x2) using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename 
cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -650,9 +650,9 @@ TEST(SM50_device_binary_or_binary_and_dsrgemm_nn_t, 32x128x8_16x64x1_4x8_4x8_2x2 using WarpShape = cutlass::gemm::GemmShape<16, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -686,9 +686,9 @@ TEST(SM50_device_binary_or_binary_and_dsrgemm_nn_t, 64x32x8_32x16x1_4x4_8x4_2x2) using WarpShape = cutlass::gemm::GemmShape<32, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -722,9 +722,9 @@ TEST(SM50_device_binary_or_binary_and_dsrgemm_nn_t, 64x64x8_32x32x1_8x4_4x8_2x2) using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename 
cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -758,9 +758,9 @@ TEST(SM50_device_binary_or_binary_and_dsrgemm_nn_t, 128x32x8_64x16x1_8x4_8x4_2x2 using WarpShape = cutlass::gemm::GemmShape<64, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -794,9 +794,9 @@ TEST(SM50_device_binary_or_binary_and_dsrgemm_nn_t, 16x64x16_8x16x1_2x2_4x8_2x4) using WarpShape = cutlass::gemm::GemmShape<8, 16, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -830,9 +830,9 @@ TEST(SM50_device_binary_or_binary_and_dsrgemm_nn_t, 16x128x16_8x32x1_2x4_4x8_2x4 using WarpShape = cutlass::gemm::GemmShape<8, 32, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename 
cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -866,9 +866,9 @@ TEST(SM50_device_binary_or_binary_and_dsrgemm_nn_t, 32x32x8_16x8x1_2x2_8x4_2x4) using WarpShape = cutlass::gemm::GemmShape<16, 8, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -902,9 +902,9 @@ TEST(SM50_device_binary_or_binary_and_dsrgemm_nn_t, 32x64x8_16x16x1_4x2_4x8_2x4) using WarpShape = cutlass::gemm::GemmShape<16, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -938,9 +938,9 @@ TEST(SM50_device_binary_or_binary_and_dsrgemm_nn_t, 32x128x8_16x32x1_4x4_4x8_2x4 using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename 
cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -974,9 +974,9 @@ TEST(SM50_device_binary_or_binary_and_dsrgemm_nn_t, 64x64x8_32x16x1_4x4_8x4_2x4) using WarpShape = cutlass::gemm::GemmShape<32, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1010,9 +1010,9 @@ TEST(SM50_device_binary_or_binary_and_dsrgemm_nn_t, 32x32x8_8x16x1_2x2_4x8_4x2) using WarpShape = cutlass::gemm::GemmShape<8, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1046,9 +1046,9 @@ TEST(SM50_device_binary_or_binary_and_dsrgemm_nn_t, 64x32x8_16x16x1_4x2_4x8_4x2) using WarpShape = cutlass::gemm::GemmShape<16, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename 
cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1082,9 +1082,9 @@ TEST(SM50_device_binary_or_binary_and_dsrgemm_nn_t, 64x64x8_16x32x1_4x4_4x8_4x2) using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1118,9 +1118,9 @@ TEST(SM50_device_binary_or_binary_and_dsrgemm_nn_t, 128x32x8_32x16x1_4x4_8x4_4x2 using WarpShape = cutlass::gemm::GemmShape<32, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1154,9 +1154,9 @@ TEST(SM50_device_binary_or_binary_and_dsrgemm_nn_t, 32x64x16_8x16x1_2x2_4x8_4x4) using WarpShape = cutlass::gemm::GemmShape<8, 16, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename 
cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1190,9 +1190,9 @@ TEST(SM50_device_binary_or_binary_and_dsrgemm_nn_t, 32x128x16_8x32x1_2x4_4x8_4x4 using WarpShape = cutlass::gemm::GemmShape<8, 32, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1226,9 +1226,9 @@ TEST(SM50_device_binary_or_binary_and_dsrgemm_nn_t, 64x32x16_16x8x1_2x2_8x4_4x4) using WarpShape = cutlass::gemm::GemmShape<16, 8, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1262,9 +1262,9 @@ TEST(SM50_device_binary_or_binary_and_dsrgemm_nn_t, 64x64x8_16x16x1_4x2_4x8_4x4) using WarpShape = cutlass::gemm::GemmShape<16, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename 
cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1298,9 +1298,9 @@ TEST(SM50_device_binary_or_binary_and_dsrgemm_nn_t, 128x32x16_32x8x1_4x2_8x4_4x4 using WarpShape = cutlass::gemm::GemmShape<32, 8, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; diff --git a/test/device/sm50_simt_binary_or_binary_and_dsrgemm_nt_n.cu b/test/device/sm50_simt_binary_or_binary_and_dsrgemm_nt_n.cu index a4e49ed..a2f3314 100644 --- a/test/device/sm50_simt_binary_or_binary_and_dsrgemm_nt_n.cu +++ b/test/device/sm50_simt_binary_or_binary_and_dsrgemm_nt_n.cu @@ -38,9 +38,9 @@ TEST(SM50_device_binary_or_binary_and_dsrgemm_nt_n, 8x32x8_8x32x1_2x4_4x8_1x1) { using WarpShape = cutlass::gemm::GemmShape<8, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = 
Config::MultiplicationOp; @@ -74,9 +74,9 @@ TEST(SM50_device_binary_or_binary_and_dsrgemm_nt_n, 16x32x8_16x32x1_4x4_4x8_1x1) using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -110,9 +110,9 @@ TEST(SM50_device_binary_or_binary_and_dsrgemm_nt_n, 16x64x8_16x64x1_4x8_4x8_1x1) using WarpShape = cutlass::gemm::GemmShape<16, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -146,9 +146,9 @@ TEST(SM50_device_binary_or_binary_and_dsrgemm_nt_n, 32x32x8_32x32x1_8x4_4x8_1x1) using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ 
-182,9 +182,9 @@ TEST(SM50_device_binary_or_binary_and_dsrgemm_nt_n, 8x32x8_8x16x1_2x2_4x8_1x2) { using WarpShape = cutlass::gemm::GemmShape<8, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -218,9 +218,9 @@ TEST(SM50_device_binary_or_binary_and_dsrgemm_nt_n, 8x64x8_8x32x1_2x4_4x8_1x2) { using WarpShape = cutlass::gemm::GemmShape<8, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -254,9 +254,9 @@ TEST(SM50_device_binary_or_binary_and_dsrgemm_nt_n, 16x32x8_16x16x1_4x2_4x8_1x2) using WarpShape = cutlass::gemm::GemmShape<16, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -290,9 +290,9 @@ 
TEST(SM50_device_binary_or_binary_and_dsrgemm_nt_n, 16x64x8_16x32x1_4x4_4x8_1x2) using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -326,9 +326,9 @@ TEST(SM50_device_binary_or_binary_and_dsrgemm_nt_n, 16x128x8_16x64x1_4x8_4x8_1x2 using WarpShape = cutlass::gemm::GemmShape<16, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -362,9 +362,9 @@ TEST(SM50_device_binary_or_binary_and_dsrgemm_nt_n, 32x32x8_32x16x1_4x4_8x4_1x2) using WarpShape = cutlass::gemm::GemmShape<32, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -398,9 +398,9 @@ 
TEST(SM50_device_binary_or_binary_and_dsrgemm_nt_n, 32x64x8_32x32x1_8x4_4x8_1x2) using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -434,9 +434,9 @@ TEST(SM50_device_binary_or_binary_and_dsrgemm_nt_n, 32x32x8_16x32x1_4x4_4x8_2x1) using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -470,9 +470,9 @@ TEST(SM50_device_binary_or_binary_and_dsrgemm_nt_n, 64x32x8_32x32x1_8x4_4x8_2x1) using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -506,9 +506,9 @@ 
TEST(SM50_device_binary_or_binary_and_dsrgemm_nt_n, 16x32x8_8x16x1_2x2_4x8_2x2) using WarpShape = cutlass::gemm::GemmShape<8, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -542,9 +542,9 @@ TEST(SM50_device_binary_or_binary_and_dsrgemm_nt_n, 16x64x8_8x32x1_2x4_4x8_2x2) using WarpShape = cutlass::gemm::GemmShape<8, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -578,9 +578,9 @@ TEST(SM50_device_binary_or_binary_and_dsrgemm_nt_n, 32x32x8_16x16x1_4x2_4x8_2x2) using WarpShape = cutlass::gemm::GemmShape<16, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -614,9 +614,9 @@ 
TEST(SM50_device_binary_or_binary_and_dsrgemm_nt_n, 32x64x8_16x32x1_4x4_4x8_2x2) using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -650,9 +650,9 @@ TEST(SM50_device_binary_or_binary_and_dsrgemm_nt_n, 32x128x8_16x64x1_4x8_4x8_2x2 using WarpShape = cutlass::gemm::GemmShape<16, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -686,9 +686,9 @@ TEST(SM50_device_binary_or_binary_and_dsrgemm_nt_n, 64x32x8_32x16x1_4x4_8x4_2x2) using WarpShape = cutlass::gemm::GemmShape<32, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -722,9 +722,9 @@ 
TEST(SM50_device_binary_or_binary_and_dsrgemm_nt_n, 64x64x8_32x32x1_8x4_4x8_2x2) using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -758,9 +758,9 @@ TEST(SM50_device_binary_or_binary_and_dsrgemm_nt_n, 128x32x8_64x16x1_8x4_8x4_2x2 using WarpShape = cutlass::gemm::GemmShape<64, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -794,9 +794,9 @@ TEST(SM50_device_binary_or_binary_and_dsrgemm_nt_n, 16x64x16_8x16x1_2x2_4x8_2x4) using WarpShape = cutlass::gemm::GemmShape<8, 16, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -830,9 +830,9 @@ 
TEST(SM50_device_binary_or_binary_and_dsrgemm_nt_n, 16x128x16_8x32x1_2x4_4x8_2x4 using WarpShape = cutlass::gemm::GemmShape<8, 32, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -866,9 +866,9 @@ TEST(SM50_device_binary_or_binary_and_dsrgemm_nt_n, 32x32x8_16x8x1_2x2_8x4_2x4) using WarpShape = cutlass::gemm::GemmShape<16, 8, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -902,9 +902,9 @@ TEST(SM50_device_binary_or_binary_and_dsrgemm_nt_n, 32x64x8_16x16x1_4x2_4x8_2x4) using WarpShape = cutlass::gemm::GemmShape<16, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -938,9 +938,9 @@ 
TEST(SM50_device_binary_or_binary_and_dsrgemm_nt_n, 32x128x8_16x32x1_4x4_4x8_2x4 using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -974,9 +974,9 @@ TEST(SM50_device_binary_or_binary_and_dsrgemm_nt_n, 64x64x8_32x16x1_4x4_8x4_2x4) using WarpShape = cutlass::gemm::GemmShape<32, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1010,9 +1010,9 @@ TEST(SM50_device_binary_or_binary_and_dsrgemm_nt_n, 32x32x8_8x16x1_2x2_4x8_4x2) using WarpShape = cutlass::gemm::GemmShape<8, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1046,9 +1046,9 @@ 
TEST(SM50_device_binary_or_binary_and_dsrgemm_nt_n, 64x32x8_16x16x1_4x2_4x8_4x2) using WarpShape = cutlass::gemm::GemmShape<16, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1082,9 +1082,9 @@ TEST(SM50_device_binary_or_binary_and_dsrgemm_nt_n, 64x64x8_16x32x1_4x4_4x8_4x2) using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1118,9 +1118,9 @@ TEST(SM50_device_binary_or_binary_and_dsrgemm_nt_n, 128x32x8_32x16x1_4x4_8x4_4x2 using WarpShape = cutlass::gemm::GemmShape<32, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1154,9 +1154,9 @@ 
TEST(SM50_device_binary_or_binary_and_dsrgemm_nt_n, 32x64x16_8x16x1_2x2_4x8_4x4) using WarpShape = cutlass::gemm::GemmShape<8, 16, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1190,9 +1190,9 @@ TEST(SM50_device_binary_or_binary_and_dsrgemm_nt_n, 32x128x16_8x32x1_2x4_4x8_4x4 using WarpShape = cutlass::gemm::GemmShape<8, 32, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1226,9 +1226,9 @@ TEST(SM50_device_binary_or_binary_and_dsrgemm_nt_n, 64x32x16_16x8x1_2x2_8x4_4x4) using WarpShape = cutlass::gemm::GemmShape<16, 8, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1262,9 +1262,9 @@ 
TEST(SM50_device_binary_or_binary_and_dsrgemm_nt_n, 64x64x8_16x16x1_4x2_4x8_4x4) using WarpShape = cutlass::gemm::GemmShape<16, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1298,9 +1298,9 @@ TEST(SM50_device_binary_or_binary_and_dsrgemm_nt_n, 128x32x16_32x8x1_4x2_8x4_4x4 using WarpShape = cutlass::gemm::GemmShape<32, 8, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; diff --git a/test/device/sm50_simt_binary_or_binary_and_dsrgemm_nt_t.cu b/test/device/sm50_simt_binary_or_binary_and_dsrgemm_nt_t.cu index 4c21b98..4860b5c 100644 --- a/test/device/sm50_simt_binary_or_binary_and_dsrgemm_nt_t.cu +++ b/test/device/sm50_simt_binary_or_binary_and_dsrgemm_nt_t.cu @@ -38,9 +38,9 @@ TEST(SM50_device_binary_or_binary_and_dsrgemm_nt_t, 8x32x8_8x32x1_2x4_4x8_1x1) { using WarpShape = cutlass::gemm::GemmShape<8, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using 
Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -74,9 +74,9 @@ TEST(SM50_device_binary_or_binary_and_dsrgemm_nt_t, 16x32x8_16x32x1_4x4_4x8_1x1) using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -110,9 +110,9 @@ TEST(SM50_device_binary_or_binary_and_dsrgemm_nt_t, 16x64x8_16x64x1_4x8_4x8_1x1) using WarpShape = cutlass::gemm::GemmShape<16, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -146,9 +146,9 @@ TEST(SM50_device_binary_or_binary_and_dsrgemm_nt_t, 32x32x8_32x32x1_8x4_4x8_1x1) using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename 
cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -182,9 +182,9 @@ TEST(SM50_device_binary_or_binary_and_dsrgemm_nt_t, 8x32x8_8x16x1_2x2_4x8_1x2) { using WarpShape = cutlass::gemm::GemmShape<8, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -218,9 +218,9 @@ TEST(SM50_device_binary_or_binary_and_dsrgemm_nt_t, 8x64x8_8x32x1_2x4_4x8_1x2) { using WarpShape = cutlass::gemm::GemmShape<8, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -254,9 +254,9 @@ TEST(SM50_device_binary_or_binary_and_dsrgemm_nt_t, 16x32x8_16x16x1_4x2_4x8_1x2) using WarpShape = cutlass::gemm::GemmShape<16, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename 
cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -290,9 +290,9 @@ TEST(SM50_device_binary_or_binary_and_dsrgemm_nt_t, 16x64x8_16x32x1_4x4_4x8_1x2) using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -326,9 +326,9 @@ TEST(SM50_device_binary_or_binary_and_dsrgemm_nt_t, 16x128x8_16x64x1_4x8_4x8_1x2 using WarpShape = cutlass::gemm::GemmShape<16, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -362,9 +362,9 @@ TEST(SM50_device_binary_or_binary_and_dsrgemm_nt_t, 32x32x8_32x16x1_4x4_8x4_1x2) using WarpShape = cutlass::gemm::GemmShape<32, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename 
cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -398,9 +398,9 @@ TEST(SM50_device_binary_or_binary_and_dsrgemm_nt_t, 32x64x8_32x32x1_8x4_4x8_1x2) using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -434,9 +434,9 @@ TEST(SM50_device_binary_or_binary_and_dsrgemm_nt_t, 32x32x8_16x32x1_4x4_4x8_2x1) using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -470,9 +470,9 @@ TEST(SM50_device_binary_or_binary_and_dsrgemm_nt_t, 64x32x8_32x32x1_8x4_4x8_2x1) using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename 
cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -506,9 +506,9 @@ TEST(SM50_device_binary_or_binary_and_dsrgemm_nt_t, 16x32x8_8x16x1_2x2_4x8_2x2) using WarpShape = cutlass::gemm::GemmShape<8, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -542,9 +542,9 @@ TEST(SM50_device_binary_or_binary_and_dsrgemm_nt_t, 16x64x8_8x32x1_2x4_4x8_2x2) using WarpShape = cutlass::gemm::GemmShape<8, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -578,9 +578,9 @@ TEST(SM50_device_binary_or_binary_and_dsrgemm_nt_t, 32x32x8_16x16x1_4x2_4x8_2x2) using WarpShape = cutlass::gemm::GemmShape<16, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename 
cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -614,9 +614,9 @@ TEST(SM50_device_binary_or_binary_and_dsrgemm_nt_t, 32x64x8_16x32x1_4x4_4x8_2x2) using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -650,9 +650,9 @@ TEST(SM50_device_binary_or_binary_and_dsrgemm_nt_t, 32x128x8_16x64x1_4x8_4x8_2x2 using WarpShape = cutlass::gemm::GemmShape<16, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -686,9 +686,9 @@ TEST(SM50_device_binary_or_binary_and_dsrgemm_nt_t, 64x32x8_32x16x1_4x4_8x4_2x2) using WarpShape = cutlass::gemm::GemmShape<32, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename 
cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -722,9 +722,9 @@ TEST(SM50_device_binary_or_binary_and_dsrgemm_nt_t, 64x64x8_32x32x1_8x4_4x8_2x2) using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -758,9 +758,9 @@ TEST(SM50_device_binary_or_binary_and_dsrgemm_nt_t, 128x32x8_64x16x1_8x4_8x4_2x2 using WarpShape = cutlass::gemm::GemmShape<64, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -794,9 +794,9 @@ TEST(SM50_device_binary_or_binary_and_dsrgemm_nt_t, 16x64x16_8x16x1_2x2_4x8_2x4) using WarpShape = cutlass::gemm::GemmShape<8, 16, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename 
cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -830,9 +830,9 @@ TEST(SM50_device_binary_or_binary_and_dsrgemm_nt_t, 16x128x16_8x32x1_2x4_4x8_2x4 using WarpShape = cutlass::gemm::GemmShape<8, 32, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -866,9 +866,9 @@ TEST(SM50_device_binary_or_binary_and_dsrgemm_nt_t, 32x32x8_16x8x1_2x2_8x4_2x4) using WarpShape = cutlass::gemm::GemmShape<16, 8, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -902,9 +902,9 @@ TEST(SM50_device_binary_or_binary_and_dsrgemm_nt_t, 32x64x8_16x16x1_4x2_4x8_2x4) using WarpShape = cutlass::gemm::GemmShape<16, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename 
cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -938,9 +938,9 @@ TEST(SM50_device_binary_or_binary_and_dsrgemm_nt_t, 32x128x8_16x32x1_4x4_4x8_2x4 using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -974,9 +974,9 @@ TEST(SM50_device_binary_or_binary_and_dsrgemm_nt_t, 64x64x8_32x16x1_4x4_8x4_2x4) using WarpShape = cutlass::gemm::GemmShape<32, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1010,9 +1010,9 @@ TEST(SM50_device_binary_or_binary_and_dsrgemm_nt_t, 32x32x8_8x16x1_2x2_4x8_4x2) using WarpShape = cutlass::gemm::GemmShape<8, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename 
cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1046,9 +1046,9 @@ TEST(SM50_device_binary_or_binary_and_dsrgemm_nt_t, 64x32x8_16x16x1_4x2_4x8_4x2) using WarpShape = cutlass::gemm::GemmShape<16, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1082,9 +1082,9 @@ TEST(SM50_device_binary_or_binary_and_dsrgemm_nt_t, 64x64x8_16x32x1_4x4_4x8_4x2) using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1118,9 +1118,9 @@ TEST(SM50_device_binary_or_binary_and_dsrgemm_nt_t, 128x32x8_32x16x1_4x4_8x4_4x2 using WarpShape = cutlass::gemm::GemmShape<32, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename 
cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1154,9 +1154,9 @@ TEST(SM50_device_binary_or_binary_and_dsrgemm_nt_t, 32x64x16_8x16x1_2x2_4x8_4x4) using WarpShape = cutlass::gemm::GemmShape<8, 16, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1190,9 +1190,9 @@ TEST(SM50_device_binary_or_binary_and_dsrgemm_nt_t, 32x128x16_8x32x1_2x4_4x8_4x4 using WarpShape = cutlass::gemm::GemmShape<8, 32, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1226,9 +1226,9 @@ TEST(SM50_device_binary_or_binary_and_dsrgemm_nt_t, 64x32x16_16x8x1_2x2_8x4_4x4) using WarpShape = cutlass::gemm::GemmShape<16, 8, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename 
cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1262,9 +1262,9 @@ TEST(SM50_device_binary_or_binary_and_dsrgemm_nt_t, 64x64x8_16x16x1_4x2_4x8_4x4) using WarpShape = cutlass::gemm::GemmShape<16, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1298,9 +1298,9 @@ TEST(SM50_device_binary_or_binary_and_dsrgemm_nt_t, 128x32x16_32x8x1_4x2_8x4_4x4 using WarpShape = cutlass::gemm::GemmShape<32, 8, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; diff --git a/test/device/sm50_simt_binary_or_binary_and_dsrgemm_tn_n.cu b/test/device/sm50_simt_binary_or_binary_and_dsrgemm_tn_n.cu index 8ceca1d..db191a5 100644 --- a/test/device/sm50_simt_binary_or_binary_and_dsrgemm_tn_n.cu +++ b/test/device/sm50_simt_binary_or_binary_and_dsrgemm_tn_n.cu @@ -38,9 +38,9 @@ TEST(SM50_device_binary_or_binary_and_dsrgemm_tn_n, 8x32x8_8x32x1_2x4_4x8_1x1) { using WarpShape = cutlass::gemm::GemmShape<8, 32, 8>; using 
InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -74,9 +74,9 @@ TEST(SM50_device_binary_or_binary_and_dsrgemm_tn_n, 16x32x8_16x32x1_4x4_4x8_1x1) using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -110,9 +110,9 @@ TEST(SM50_device_binary_or_binary_and_dsrgemm_tn_n, 16x64x8_16x64x1_4x8_4x8_1x1) using WarpShape = cutlass::gemm::GemmShape<16, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -146,9 +146,9 @@ TEST(SM50_device_binary_or_binary_and_dsrgemm_tn_n, 32x32x8_32x32x1_8x4_4x8_1x1) using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = 
cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -182,9 +182,9 @@ TEST(SM50_device_binary_or_binary_and_dsrgemm_tn_n, 8x32x8_8x16x1_2x2_4x8_1x2) { using WarpShape = cutlass::gemm::GemmShape<8, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -218,9 +218,9 @@ TEST(SM50_device_binary_or_binary_and_dsrgemm_tn_n, 8x64x8_8x32x1_2x4_4x8_1x2) { using WarpShape = cutlass::gemm::GemmShape<8, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -254,9 +254,9 @@ TEST(SM50_device_binary_or_binary_and_dsrgemm_tn_n, 16x32x8_16x16x1_4x2_4x8_1x2) using WarpShape = cutlass::gemm::GemmShape<16, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 
1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -290,9 +290,9 @@ TEST(SM50_device_binary_or_binary_and_dsrgemm_tn_n, 16x64x8_16x32x1_4x4_4x8_1x2) using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -326,9 +326,9 @@ TEST(SM50_device_binary_or_binary_and_dsrgemm_tn_n, 16x128x8_16x64x1_4x8_4x8_1x2 using WarpShape = cutlass::gemm::GemmShape<16, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -362,9 +362,9 @@ TEST(SM50_device_binary_or_binary_and_dsrgemm_tn_n, 32x32x8_32x16x1_4x4_8x4_1x2) using WarpShape = cutlass::gemm::GemmShape<32, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = 
typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -398,9 +398,9 @@ TEST(SM50_device_binary_or_binary_and_dsrgemm_tn_n, 32x64x8_32x32x1_8x4_4x8_1x2) using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -434,9 +434,9 @@ TEST(SM50_device_binary_or_binary_and_dsrgemm_tn_n, 32x32x8_16x32x1_4x4_4x8_2x1) using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -470,9 +470,9 @@ TEST(SM50_device_binary_or_binary_and_dsrgemm_tn_n, 64x32x8_32x32x1_8x4_4x8_2x1) using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename 
cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -506,9 +506,9 @@ TEST(SM50_device_binary_or_binary_and_dsrgemm_tn_n, 16x32x8_8x16x1_2x2_4x8_2x2) using WarpShape = cutlass::gemm::GemmShape<8, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -542,9 +542,9 @@ TEST(SM50_device_binary_or_binary_and_dsrgemm_tn_n, 16x64x8_8x32x1_2x4_4x8_2x2) using WarpShape = cutlass::gemm::GemmShape<8, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -578,9 +578,9 @@ TEST(SM50_device_binary_or_binary_and_dsrgemm_tn_n, 32x32x8_16x16x1_4x2_4x8_2x2) using WarpShape = cutlass::gemm::GemmShape<16, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename 
cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -614,9 +614,9 @@ TEST(SM50_device_binary_or_binary_and_dsrgemm_tn_n, 32x64x8_16x32x1_4x4_4x8_2x2) using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -650,9 +650,9 @@ TEST(SM50_device_binary_or_binary_and_dsrgemm_tn_n, 32x128x8_16x64x1_4x8_4x8_2x2 using WarpShape = cutlass::gemm::GemmShape<16, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -686,9 +686,9 @@ TEST(SM50_device_binary_or_binary_and_dsrgemm_tn_n, 64x32x8_32x16x1_4x4_8x4_2x2) using WarpShape = cutlass::gemm::GemmShape<32, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename 
cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -722,9 +722,9 @@ TEST(SM50_device_binary_or_binary_and_dsrgemm_tn_n, 64x64x8_32x32x1_8x4_4x8_2x2) using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -758,9 +758,9 @@ TEST(SM50_device_binary_or_binary_and_dsrgemm_tn_n, 128x32x8_64x16x1_8x4_8x4_2x2 using WarpShape = cutlass::gemm::GemmShape<64, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -794,9 +794,9 @@ TEST(SM50_device_binary_or_binary_and_dsrgemm_tn_n, 16x64x16_8x16x1_2x2_4x8_2x4) using WarpShape = cutlass::gemm::GemmShape<8, 16, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename 
cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -830,9 +830,9 @@ TEST(SM50_device_binary_or_binary_and_dsrgemm_tn_n, 16x128x16_8x32x1_2x4_4x8_2x4 using WarpShape = cutlass::gemm::GemmShape<8, 32, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -866,9 +866,9 @@ TEST(SM50_device_binary_or_binary_and_dsrgemm_tn_n, 32x32x8_16x8x1_2x2_8x4_2x4) using WarpShape = cutlass::gemm::GemmShape<16, 8, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -902,9 +902,9 @@ TEST(SM50_device_binary_or_binary_and_dsrgemm_tn_n, 32x64x8_16x16x1_4x2_4x8_2x4) using WarpShape = cutlass::gemm::GemmShape<16, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename 
cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -938,9 +938,9 @@ TEST(SM50_device_binary_or_binary_and_dsrgemm_tn_n, 32x128x8_16x32x1_4x4_4x8_2x4 using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -974,9 +974,9 @@ TEST(SM50_device_binary_or_binary_and_dsrgemm_tn_n, 64x64x8_32x16x1_4x4_8x4_2x4) using WarpShape = cutlass::gemm::GemmShape<32, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1010,9 +1010,9 @@ TEST(SM50_device_binary_or_binary_and_dsrgemm_tn_n, 32x32x8_8x16x1_2x2_4x8_4x2) using WarpShape = cutlass::gemm::GemmShape<8, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename 
cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1046,9 +1046,9 @@ TEST(SM50_device_binary_or_binary_and_dsrgemm_tn_n, 64x32x8_16x16x1_4x2_4x8_4x2) using WarpShape = cutlass::gemm::GemmShape<16, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1082,9 +1082,9 @@ TEST(SM50_device_binary_or_binary_and_dsrgemm_tn_n, 64x64x8_16x32x1_4x4_4x8_4x2) using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1118,9 +1118,9 @@ TEST(SM50_device_binary_or_binary_and_dsrgemm_tn_n, 128x32x8_32x16x1_4x4_8x4_4x2 using WarpShape = cutlass::gemm::GemmShape<32, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename 
cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1154,9 +1154,9 @@ TEST(SM50_device_binary_or_binary_and_dsrgemm_tn_n, 32x64x16_8x16x1_2x2_4x8_4x4) using WarpShape = cutlass::gemm::GemmShape<8, 16, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1190,9 +1190,9 @@ TEST(SM50_device_binary_or_binary_and_dsrgemm_tn_n, 32x128x16_8x32x1_2x4_4x8_4x4 using WarpShape = cutlass::gemm::GemmShape<8, 32, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1226,9 +1226,9 @@ TEST(SM50_device_binary_or_binary_and_dsrgemm_tn_n, 64x32x16_16x8x1_2x2_8x4_4x4) using WarpShape = cutlass::gemm::GemmShape<16, 8, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename 
cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1262,9 +1262,9 @@ TEST(SM50_device_binary_or_binary_and_dsrgemm_tn_n, 64x64x8_16x16x1_4x2_4x8_4x4) using WarpShape = cutlass::gemm::GemmShape<16, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1298,9 +1298,9 @@ TEST(SM50_device_binary_or_binary_and_dsrgemm_tn_n, 128x32x16_32x8x1_4x2_8x4_4x4 using WarpShape = cutlass::gemm::GemmShape<32, 8, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; diff --git a/test/device/sm50_simt_binary_or_binary_and_dsrgemm_tn_t.cu b/test/device/sm50_simt_binary_or_binary_and_dsrgemm_tn_t.cu index f6dd6d6..2216786 100644 --- a/test/device/sm50_simt_binary_or_binary_and_dsrgemm_tn_t.cu +++ 
b/test/device/sm50_simt_binary_or_binary_and_dsrgemm_tn_t.cu @@ -38,9 +38,9 @@ TEST(SM50_device_binary_or_binary_and_dsrgemm_tn_t, 8x32x8_8x32x1_2x4_4x8_1x1) { using WarpShape = cutlass::gemm::GemmShape<8, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -74,9 +74,9 @@ TEST(SM50_device_binary_or_binary_and_dsrgemm_tn_t, 16x32x8_16x32x1_4x4_4x8_1x1) using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -110,9 +110,9 @@ TEST(SM50_device_binary_or_binary_and_dsrgemm_tn_t, 16x64x8_16x64x1_4x8_4x8_1x1) using WarpShape = cutlass::gemm::GemmShape<16, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp 
= Config::MultiplicationOp; @@ -146,9 +146,9 @@ TEST(SM50_device_binary_or_binary_and_dsrgemm_tn_t, 32x32x8_32x32x1_8x4_4x8_1x1) using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -182,9 +182,9 @@ TEST(SM50_device_binary_or_binary_and_dsrgemm_tn_t, 8x32x8_8x16x1_2x2_4x8_1x2) { using WarpShape = cutlass::gemm::GemmShape<8, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -218,9 +218,9 @@ TEST(SM50_device_binary_or_binary_and_dsrgemm_tn_t, 8x64x8_8x32x1_2x4_4x8_1x2) { using WarpShape = cutlass::gemm::GemmShape<8, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ 
-254,9 +254,9 @@ TEST(SM50_device_binary_or_binary_and_dsrgemm_tn_t, 16x32x8_16x16x1_4x2_4x8_1x2) using WarpShape = cutlass::gemm::GemmShape<16, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -290,9 +290,9 @@ TEST(SM50_device_binary_or_binary_and_dsrgemm_tn_t, 16x64x8_16x32x1_4x4_4x8_1x2) using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -326,9 +326,9 @@ TEST(SM50_device_binary_or_binary_and_dsrgemm_tn_t, 16x128x8_16x64x1_4x8_4x8_1x2 using WarpShape = cutlass::gemm::GemmShape<16, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -362,9 +362,9 @@ 
TEST(SM50_device_binary_or_binary_and_dsrgemm_tn_t, 32x32x8_32x16x1_4x4_8x4_1x2) using WarpShape = cutlass::gemm::GemmShape<32, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -398,9 +398,9 @@ TEST(SM50_device_binary_or_binary_and_dsrgemm_tn_t, 32x64x8_32x32x1_8x4_4x8_1x2) using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -434,9 +434,9 @@ TEST(SM50_device_binary_or_binary_and_dsrgemm_tn_t, 32x32x8_16x32x1_4x4_4x8_2x1) using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -470,9 +470,9 @@ 
TEST(SM50_device_binary_or_binary_and_dsrgemm_tn_t, 64x32x8_32x32x1_8x4_4x8_2x1) using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -506,9 +506,9 @@ TEST(SM50_device_binary_or_binary_and_dsrgemm_tn_t, 16x32x8_8x16x1_2x2_4x8_2x2) using WarpShape = cutlass::gemm::GemmShape<8, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -542,9 +542,9 @@ TEST(SM50_device_binary_or_binary_and_dsrgemm_tn_t, 16x64x8_8x32x1_2x4_4x8_2x2) using WarpShape = cutlass::gemm::GemmShape<8, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -578,9 +578,9 @@ 
TEST(SM50_device_binary_or_binary_and_dsrgemm_tn_t, 32x32x8_16x16x1_4x2_4x8_2x2) using WarpShape = cutlass::gemm::GemmShape<16, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -614,9 +614,9 @@ TEST(SM50_device_binary_or_binary_and_dsrgemm_tn_t, 32x64x8_16x32x1_4x4_4x8_2x2) using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -650,9 +650,9 @@ TEST(SM50_device_binary_or_binary_and_dsrgemm_tn_t, 32x128x8_16x64x1_4x8_4x8_2x2 using WarpShape = cutlass::gemm::GemmShape<16, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -686,9 +686,9 @@ 
TEST(SM50_device_binary_or_binary_and_dsrgemm_tn_t, 64x32x8_32x16x1_4x4_8x4_2x2) using WarpShape = cutlass::gemm::GemmShape<32, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -722,9 +722,9 @@ TEST(SM50_device_binary_or_binary_and_dsrgemm_tn_t, 64x64x8_32x32x1_8x4_4x8_2x2) using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -758,9 +758,9 @@ TEST(SM50_device_binary_or_binary_and_dsrgemm_tn_t, 128x32x8_64x16x1_8x4_8x4_2x2 using WarpShape = cutlass::gemm::GemmShape<64, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -794,9 +794,9 @@ 
TEST(SM50_device_binary_or_binary_and_dsrgemm_tn_t, 16x64x16_8x16x1_2x2_4x8_2x4) using WarpShape = cutlass::gemm::GemmShape<8, 16, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -830,9 +830,9 @@ TEST(SM50_device_binary_or_binary_and_dsrgemm_tn_t, 16x128x16_8x32x1_2x4_4x8_2x4 using WarpShape = cutlass::gemm::GemmShape<8, 32, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -866,9 +866,9 @@ TEST(SM50_device_binary_or_binary_and_dsrgemm_tn_t, 32x32x8_16x8x1_2x2_8x4_2x4) using WarpShape = cutlass::gemm::GemmShape<16, 8, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -902,9 +902,9 @@ 
TEST(SM50_device_binary_or_binary_and_dsrgemm_tn_t, 32x64x8_16x16x1_4x2_4x8_2x4) using WarpShape = cutlass::gemm::GemmShape<16, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -938,9 +938,9 @@ TEST(SM50_device_binary_or_binary_and_dsrgemm_tn_t, 32x128x8_16x32x1_4x4_4x8_2x4 using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -974,9 +974,9 @@ TEST(SM50_device_binary_or_binary_and_dsrgemm_tn_t, 64x64x8_32x16x1_4x4_8x4_2x4) using WarpShape = cutlass::gemm::GemmShape<32, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1010,9 +1010,9 @@ 
TEST(SM50_device_binary_or_binary_and_dsrgemm_tn_t, 32x32x8_8x16x1_2x2_4x8_4x2) using WarpShape = cutlass::gemm::GemmShape<8, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1046,9 +1046,9 @@ TEST(SM50_device_binary_or_binary_and_dsrgemm_tn_t, 64x32x8_16x16x1_4x2_4x8_4x2) using WarpShape = cutlass::gemm::GemmShape<16, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1082,9 +1082,9 @@ TEST(SM50_device_binary_or_binary_and_dsrgemm_tn_t, 64x64x8_16x32x1_4x4_4x8_4x2) using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1118,9 +1118,9 @@ 
TEST(SM50_device_binary_or_binary_and_dsrgemm_tn_t, 128x32x8_32x16x1_4x4_8x4_4x2 using WarpShape = cutlass::gemm::GemmShape<32, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1154,9 +1154,9 @@ TEST(SM50_device_binary_or_binary_and_dsrgemm_tn_t, 32x64x16_8x16x1_2x2_4x8_4x4) using WarpShape = cutlass::gemm::GemmShape<8, 16, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1190,9 +1190,9 @@ TEST(SM50_device_binary_or_binary_and_dsrgemm_tn_t, 32x128x16_8x32x1_2x4_4x8_4x4 using WarpShape = cutlass::gemm::GemmShape<8, 32, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1226,9 +1226,9 @@ 
TEST(SM50_device_binary_or_binary_and_dsrgemm_tn_t, 64x32x16_16x8x1_2x2_8x4_4x4) using WarpShape = cutlass::gemm::GemmShape<16, 8, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1262,9 +1262,9 @@ TEST(SM50_device_binary_or_binary_and_dsrgemm_tn_t, 64x64x8_16x16x1_4x2_4x8_4x4) using WarpShape = cutlass::gemm::GemmShape<16, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1298,9 +1298,9 @@ TEST(SM50_device_binary_or_binary_and_dsrgemm_tn_t, 128x32x16_32x8x1_4x2_8x4_4x4 using WarpShape = cutlass::gemm::GemmShape<32, 8, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; diff --git 
a/test/device/sm50_simt_binary_or_binary_and_dsrgemm_tt_n.cu b/test/device/sm50_simt_binary_or_binary_and_dsrgemm_tt_n.cu index 49958ad..0771a23 100644 --- a/test/device/sm50_simt_binary_or_binary_and_dsrgemm_tt_n.cu +++ b/test/device/sm50_simt_binary_or_binary_and_dsrgemm_tt_n.cu @@ -38,9 +38,9 @@ TEST(SM50_device_binary_or_binary_and_dsrgemm_tt_n, 8x32x8_8x32x1_2x4_4x8_1x1) { using WarpShape = cutlass::gemm::GemmShape<8, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -74,9 +74,9 @@ TEST(SM50_device_binary_or_binary_and_dsrgemm_tt_n, 16x32x8_16x32x1_4x4_4x8_1x1) using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -110,9 +110,9 @@ TEST(SM50_device_binary_or_binary_and_dsrgemm_tt_n, 16x64x8_16x64x1_4x8_4x8_1x1) using WarpShape = cutlass::gemm::GemmShape<16, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + 
using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -146,9 +146,9 @@ TEST(SM50_device_binary_or_binary_and_dsrgemm_tt_n, 32x32x8_32x32x1_8x4_4x8_1x1) using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -182,9 +182,9 @@ TEST(SM50_device_binary_or_binary_and_dsrgemm_tt_n, 8x32x8_8x16x1_2x2_4x8_1x2) { using WarpShape = cutlass::gemm::GemmShape<8, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -218,9 +218,9 @@ TEST(SM50_device_binary_or_binary_and_dsrgemm_tt_n, 8x64x8_8x32x1_2x4_4x8_1x2) { using WarpShape = cutlass::gemm::GemmShape<8, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename 
cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -254,9 +254,9 @@ TEST(SM50_device_binary_or_binary_and_dsrgemm_tt_n, 16x32x8_16x16x1_4x2_4x8_1x2) using WarpShape = cutlass::gemm::GemmShape<16, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -290,9 +290,9 @@ TEST(SM50_device_binary_or_binary_and_dsrgemm_tt_n, 16x64x8_16x32x1_4x4_4x8_1x2) using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -326,9 +326,9 @@ TEST(SM50_device_binary_or_binary_and_dsrgemm_tt_n, 16x128x8_16x64x1_4x8_4x8_1x2 using WarpShape = cutlass::gemm::GemmShape<16, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename 
cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -362,9 +362,9 @@ TEST(SM50_device_binary_or_binary_and_dsrgemm_tt_n, 32x32x8_32x16x1_4x4_8x4_1x2) using WarpShape = cutlass::gemm::GemmShape<32, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -398,9 +398,9 @@ TEST(SM50_device_binary_or_binary_and_dsrgemm_tt_n, 32x64x8_32x32x1_8x4_4x8_1x2) using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -434,9 +434,9 @@ TEST(SM50_device_binary_or_binary_and_dsrgemm_tt_n, 32x32x8_16x32x1_4x4_4x8_2x1) using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename 
cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -470,9 +470,9 @@ TEST(SM50_device_binary_or_binary_and_dsrgemm_tt_n, 64x32x8_32x32x1_8x4_4x8_2x1) using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -506,9 +506,9 @@ TEST(SM50_device_binary_or_binary_and_dsrgemm_tt_n, 16x32x8_8x16x1_2x2_4x8_2x2) using WarpShape = cutlass::gemm::GemmShape<8, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -542,9 +542,9 @@ TEST(SM50_device_binary_or_binary_and_dsrgemm_tt_n, 16x64x8_8x32x1_2x4_4x8_2x2) using WarpShape = cutlass::gemm::GemmShape<8, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename 
cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -578,9 +578,9 @@ TEST(SM50_device_binary_or_binary_and_dsrgemm_tt_n, 32x32x8_16x16x1_4x2_4x8_2x2) using WarpShape = cutlass::gemm::GemmShape<16, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -614,9 +614,9 @@ TEST(SM50_device_binary_or_binary_and_dsrgemm_tt_n, 32x64x8_16x32x1_4x4_4x8_2x2) using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -650,9 +650,9 @@ TEST(SM50_device_binary_or_binary_and_dsrgemm_tt_n, 32x128x8_16x64x1_4x8_4x8_2x2 using WarpShape = cutlass::gemm::GemmShape<16, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename 
cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -686,9 +686,9 @@ TEST(SM50_device_binary_or_binary_and_dsrgemm_tt_n, 64x32x8_32x16x1_4x4_8x4_2x2) using WarpShape = cutlass::gemm::GemmShape<32, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -722,9 +722,9 @@ TEST(SM50_device_binary_or_binary_and_dsrgemm_tt_n, 64x64x8_32x32x1_8x4_4x8_2x2) using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -758,9 +758,9 @@ TEST(SM50_device_binary_or_binary_and_dsrgemm_tt_n, 128x32x8_64x16x1_8x4_8x4_2x2 using WarpShape = cutlass::gemm::GemmShape<64, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename 
cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -794,9 +794,9 @@ TEST(SM50_device_binary_or_binary_and_dsrgemm_tt_n, 16x64x16_8x16x1_2x2_4x8_2x4) using WarpShape = cutlass::gemm::GemmShape<8, 16, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -830,9 +830,9 @@ TEST(SM50_device_binary_or_binary_and_dsrgemm_tt_n, 16x128x16_8x32x1_2x4_4x8_2x4 using WarpShape = cutlass::gemm::GemmShape<8, 32, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -866,9 +866,9 @@ TEST(SM50_device_binary_or_binary_and_dsrgemm_tt_n, 32x32x8_16x8x1_2x2_8x4_2x4) using WarpShape = cutlass::gemm::GemmShape<16, 8, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename 
cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -902,9 +902,9 @@ TEST(SM50_device_binary_or_binary_and_dsrgemm_tt_n, 32x64x8_16x16x1_4x2_4x8_2x4) using WarpShape = cutlass::gemm::GemmShape<16, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -938,9 +938,9 @@ TEST(SM50_device_binary_or_binary_and_dsrgemm_tt_n, 32x128x8_16x32x1_4x4_4x8_2x4 using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -974,9 +974,9 @@ TEST(SM50_device_binary_or_binary_and_dsrgemm_tt_n, 64x64x8_32x16x1_4x4_8x4_2x4) using WarpShape = cutlass::gemm::GemmShape<32, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename 
cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1010,9 +1010,9 @@ TEST(SM50_device_binary_or_binary_and_dsrgemm_tt_n, 32x32x8_8x16x1_2x2_4x8_4x2) using WarpShape = cutlass::gemm::GemmShape<8, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1046,9 +1046,9 @@ TEST(SM50_device_binary_or_binary_and_dsrgemm_tt_n, 64x32x8_16x16x1_4x2_4x8_4x2) using WarpShape = cutlass::gemm::GemmShape<16, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1082,9 +1082,9 @@ TEST(SM50_device_binary_or_binary_and_dsrgemm_tt_n, 64x64x8_16x32x1_4x4_4x8_4x2) using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename 
cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1118,9 +1118,9 @@ TEST(SM50_device_binary_or_binary_and_dsrgemm_tt_n, 128x32x8_32x16x1_4x4_8x4_4x2 using WarpShape = cutlass::gemm::GemmShape<32, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1154,9 +1154,9 @@ TEST(SM50_device_binary_or_binary_and_dsrgemm_tt_n, 32x64x16_8x16x1_2x2_4x8_4x4) using WarpShape = cutlass::gemm::GemmShape<8, 16, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1190,9 +1190,9 @@ TEST(SM50_device_binary_or_binary_and_dsrgemm_tt_n, 32x128x16_8x32x1_2x4_4x8_4x4 using WarpShape = cutlass::gemm::GemmShape<8, 32, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename 
cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1226,9 +1226,9 @@ TEST(SM50_device_binary_or_binary_and_dsrgemm_tt_n, 64x32x16_16x8x1_2x2_8x4_4x4) using WarpShape = cutlass::gemm::GemmShape<16, 8, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1262,9 +1262,9 @@ TEST(SM50_device_binary_or_binary_and_dsrgemm_tt_n, 64x64x8_16x16x1_4x2_4x8_4x4) using WarpShape = cutlass::gemm::GemmShape<16, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1298,9 +1298,9 @@ TEST(SM50_device_binary_or_binary_and_dsrgemm_tt_n, 128x32x16_32x8x1_4x2_8x4_4x4 using WarpShape = cutlass::gemm::GemmShape<32, 8, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename 
cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; diff --git a/test/device/sm50_simt_binary_or_binary_and_dsrgemm_tt_t.cu b/test/device/sm50_simt_binary_or_binary_and_dsrgemm_tt_t.cu index 006cac2..f4cee74 100644 --- a/test/device/sm50_simt_binary_or_binary_and_dsrgemm_tt_t.cu +++ b/test/device/sm50_simt_binary_or_binary_and_dsrgemm_tt_t.cu @@ -38,9 +38,9 @@ TEST(SM50_device_binary_or_binary_and_dsrgemm_tt_t, 8x32x8_8x32x1_2x4_4x8_1x1) { using WarpShape = cutlass::gemm::GemmShape<8, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -74,9 +74,9 @@ TEST(SM50_device_binary_or_binary_and_dsrgemm_tt_t, 16x32x8_16x32x1_4x4_4x8_1x1) using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -110,9 +110,9 @@ TEST(SM50_device_binary_or_binary_and_dsrgemm_tt_t, 16x64x8_16x64x1_4x8_4x8_1x1) using WarpShape = cutlass::gemm::GemmShape<16, 64, 8>; using 
InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -146,9 +146,9 @@ TEST(SM50_device_binary_or_binary_and_dsrgemm_tt_t, 32x32x8_32x32x1_8x4_4x8_1x1) using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -182,9 +182,9 @@ TEST(SM50_device_binary_or_binary_and_dsrgemm_tt_t, 8x32x8_8x16x1_2x2_4x8_1x2) { using WarpShape = cutlass::gemm::GemmShape<8, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -218,9 +218,9 @@ TEST(SM50_device_binary_or_binary_and_dsrgemm_tt_t, 8x64x8_8x32x1_2x4_4x8_1x2) { using WarpShape = cutlass::gemm::GemmShape<8, 32, 8>; using InstructionShape = 
cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -254,9 +254,9 @@ TEST(SM50_device_binary_or_binary_and_dsrgemm_tt_t, 16x32x8_16x16x1_4x2_4x8_1x2) using WarpShape = cutlass::gemm::GemmShape<16, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -290,9 +290,9 @@ TEST(SM50_device_binary_or_binary_and_dsrgemm_tt_t, 16x64x8_16x32x1_4x4_4x8_1x2) using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -326,9 +326,9 @@ TEST(SM50_device_binary_or_binary_and_dsrgemm_tt_t, 16x128x8_16x64x1_4x8_4x8_1x2 using WarpShape = cutlass::gemm::GemmShape<16, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 
1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -362,9 +362,9 @@ TEST(SM50_device_binary_or_binary_and_dsrgemm_tt_t, 32x32x8_32x16x1_4x4_8x4_1x2) using WarpShape = cutlass::gemm::GemmShape<32, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -398,9 +398,9 @@ TEST(SM50_device_binary_or_binary_and_dsrgemm_tt_t, 32x64x8_32x32x1_8x4_4x8_1x2) using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -434,9 +434,9 @@ TEST(SM50_device_binary_or_binary_and_dsrgemm_tt_t, 32x32x8_16x32x1_4x4_4x8_2x1) using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = 
typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -470,9 +470,9 @@ TEST(SM50_device_binary_or_binary_and_dsrgemm_tt_t, 64x32x8_32x32x1_8x4_4x8_2x1) using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -506,9 +506,9 @@ TEST(SM50_device_binary_or_binary_and_dsrgemm_tt_t, 16x32x8_8x16x1_2x2_4x8_2x2) using WarpShape = cutlass::gemm::GemmShape<8, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -542,9 +542,9 @@ TEST(SM50_device_binary_or_binary_and_dsrgemm_tt_t, 16x64x8_8x32x1_2x4_4x8_2x2) using WarpShape = cutlass::gemm::GemmShape<8, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename 
cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -578,9 +578,9 @@ TEST(SM50_device_binary_or_binary_and_dsrgemm_tt_t, 32x32x8_16x16x1_4x2_4x8_2x2) using WarpShape = cutlass::gemm::GemmShape<16, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -614,9 +614,9 @@ TEST(SM50_device_binary_or_binary_and_dsrgemm_tt_t, 32x64x8_16x32x1_4x4_4x8_2x2) using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -650,9 +650,9 @@ TEST(SM50_device_binary_or_binary_and_dsrgemm_tt_t, 32x128x8_16x64x1_4x8_4x8_2x2 using WarpShape = cutlass::gemm::GemmShape<16, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename 
cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -686,9 +686,9 @@ TEST(SM50_device_binary_or_binary_and_dsrgemm_tt_t, 64x32x8_32x16x1_4x4_8x4_2x2) using WarpShape = cutlass::gemm::GemmShape<32, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -722,9 +722,9 @@ TEST(SM50_device_binary_or_binary_and_dsrgemm_tt_t, 64x64x8_32x32x1_8x4_4x8_2x2) using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -758,9 +758,9 @@ TEST(SM50_device_binary_or_binary_and_dsrgemm_tt_t, 128x32x8_64x16x1_8x4_8x4_2x2 using WarpShape = cutlass::gemm::GemmShape<64, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename 
cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -794,9 +794,9 @@ TEST(SM50_device_binary_or_binary_and_dsrgemm_tt_t, 16x64x16_8x16x1_2x2_4x8_2x4) using WarpShape = cutlass::gemm::GemmShape<8, 16, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -830,9 +830,9 @@ TEST(SM50_device_binary_or_binary_and_dsrgemm_tt_t, 16x128x16_8x32x1_2x4_4x8_2x4 using WarpShape = cutlass::gemm::GemmShape<8, 32, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -866,9 +866,9 @@ TEST(SM50_device_binary_or_binary_and_dsrgemm_tt_t, 32x32x8_16x8x1_2x2_8x4_2x4) using WarpShape = cutlass::gemm::GemmShape<16, 8, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename 
cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -902,9 +902,9 @@ TEST(SM50_device_binary_or_binary_and_dsrgemm_tt_t, 32x64x8_16x16x1_4x2_4x8_2x4) using WarpShape = cutlass::gemm::GemmShape<16, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -938,9 +938,9 @@ TEST(SM50_device_binary_or_binary_and_dsrgemm_tt_t, 32x128x8_16x32x1_4x4_4x8_2x4 using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -974,9 +974,9 @@ TEST(SM50_device_binary_or_binary_and_dsrgemm_tt_t, 64x64x8_32x16x1_4x4_8x4_2x4) using WarpShape = cutlass::gemm::GemmShape<32, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename 
cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1010,9 +1010,9 @@ TEST(SM50_device_binary_or_binary_and_dsrgemm_tt_t, 32x32x8_8x16x1_2x2_4x8_4x2) using WarpShape = cutlass::gemm::GemmShape<8, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1046,9 +1046,9 @@ TEST(SM50_device_binary_or_binary_and_dsrgemm_tt_t, 64x32x8_16x16x1_4x2_4x8_4x2) using WarpShape = cutlass::gemm::GemmShape<16, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1082,9 +1082,9 @@ TEST(SM50_device_binary_or_binary_and_dsrgemm_tt_t, 64x64x8_16x32x1_4x4_4x8_4x2) using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename 
cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1118,9 +1118,9 @@ TEST(SM50_device_binary_or_binary_and_dsrgemm_tt_t, 128x32x8_32x16x1_4x4_8x4_4x2 using WarpShape = cutlass::gemm::GemmShape<32, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1154,9 +1154,9 @@ TEST(SM50_device_binary_or_binary_and_dsrgemm_tt_t, 32x64x16_8x16x1_2x2_4x8_4x4) using WarpShape = cutlass::gemm::GemmShape<8, 16, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1190,9 +1190,9 @@ TEST(SM50_device_binary_or_binary_and_dsrgemm_tt_t, 32x128x16_8x32x1_2x4_4x8_4x4 using WarpShape = cutlass::gemm::GemmShape<8, 32, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename 
cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1226,9 +1226,9 @@ TEST(SM50_device_binary_or_binary_and_dsrgemm_tt_t, 64x32x16_16x8x1_2x2_8x4_4x4) using WarpShape = cutlass::gemm::GemmShape<16, 8, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1262,9 +1262,9 @@ TEST(SM50_device_binary_or_binary_and_dsrgemm_tt_t, 64x64x8_16x16x1_4x2_4x8_4x4) using WarpShape = cutlass::gemm::GemmShape<16, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1298,9 +1298,9 @@ TEST(SM50_device_binary_or_binary_and_dsrgemm_tt_t, 128x32x16_32x8x1_4x2_8x4_4x4 using WarpShape = cutlass::gemm::GemmShape<32, 8, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename 
cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; diff --git a/test/device/sm50_simt_binary_or_binary_and_ssrgemm_nn_n.cu b/test/device/sm50_simt_binary_or_binary_and_ssrgemm_nn_n.cu index 17176dd..88ff931 100644 --- a/test/device/sm50_simt_binary_or_binary_and_ssrgemm_nn_n.cu +++ b/test/device/sm50_simt_binary_or_binary_and_ssrgemm_nn_n.cu @@ -38,9 +38,9 @@ TEST(SM50_device_binary_or_binary_and_ssrgemm_nn_n, 8x32x8_8x32x1_2x4_4x8_1x1) { using WarpShape = cutlass::gemm::GemmShape<8, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -74,9 +74,9 @@ TEST(SM50_device_binary_or_binary_and_ssrgemm_nn_n, 16x32x8_16x32x1_4x4_4x8_1x1) using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = 
Config::MultiplicationOp; @@ -110,9 +110,9 @@ TEST(SM50_device_binary_or_binary_and_ssrgemm_nn_n, 16x64x8_16x64x1_4x8_4x8_1x1) using WarpShape = cutlass::gemm::GemmShape<16, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -146,9 +146,9 @@ TEST(SM50_device_binary_or_binary_and_ssrgemm_nn_n, 32x32x8_32x32x1_8x4_4x8_1x1) using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -182,9 +182,9 @@ TEST(SM50_device_binary_or_binary_and_ssrgemm_nn_n, 32x64x8_32x64x1_8x8_4x8_1x1) using WarpShape = cutlass::gemm::GemmShape<32, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ 
-218,9 +218,9 @@ TEST(SM50_device_binary_or_binary_and_ssrgemm_nn_n, 64x32x8_64x32x1_8x8_8x4_1x1) using WarpShape = cutlass::gemm::GemmShape<64, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -254,9 +254,9 @@ TEST(SM50_device_binary_or_binary_and_ssrgemm_nn_n, 8x32x8_8x16x1_2x2_4x8_1x2) { using WarpShape = cutlass::gemm::GemmShape<8, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -290,9 +290,9 @@ TEST(SM50_device_binary_or_binary_and_ssrgemm_nn_n, 8x64x8_8x32x1_2x4_4x8_1x2) { using WarpShape = cutlass::gemm::GemmShape<8, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -326,9 +326,9 @@ 
TEST(SM50_device_binary_or_binary_and_ssrgemm_nn_n, 16x32x8_16x16x1_4x2_4x8_1x2) using WarpShape = cutlass::gemm::GemmShape<16, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -362,9 +362,9 @@ TEST(SM50_device_binary_or_binary_and_ssrgemm_nn_n, 16x64x8_16x32x1_4x4_4x8_1x2) using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -398,9 +398,9 @@ TEST(SM50_device_binary_or_binary_and_ssrgemm_nn_n, 16x128x8_16x64x1_4x8_4x8_1x2 using WarpShape = cutlass::gemm::GemmShape<16, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -434,9 +434,9 @@ 
TEST(SM50_device_binary_or_binary_and_ssrgemm_nn_n, 32x32x8_32x16x1_4x4_8x4_1x2) using WarpShape = cutlass::gemm::GemmShape<32, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -470,9 +470,9 @@ TEST(SM50_device_binary_or_binary_and_ssrgemm_nn_n, 32x64x8_32x32x1_8x4_4x8_1x2) using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -506,9 +506,9 @@ TEST(SM50_device_binary_or_binary_and_ssrgemm_nn_n, 32x128x8_32x64x1_8x8_4x8_1x2 using WarpShape = cutlass::gemm::GemmShape<32, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -542,9 +542,9 @@ 
TEST(SM50_device_binary_or_binary_and_ssrgemm_nn_n, 64x64x8_64x32x1_8x8_8x4_1x2) using WarpShape = cutlass::gemm::GemmShape<64, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -578,9 +578,9 @@ TEST(SM50_device_binary_or_binary_and_ssrgemm_nn_n, 32x32x8_16x32x1_4x4_4x8_2x1) using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -614,9 +614,9 @@ TEST(SM50_device_binary_or_binary_and_ssrgemm_nn_n, 64x32x8_32x32x1_8x4_4x8_2x1) using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -650,9 +650,9 @@ 
TEST(SM50_device_binary_or_binary_and_ssrgemm_nn_n, 64x64x8_32x64x1_8x8_4x8_2x1) using WarpShape = cutlass::gemm::GemmShape<32, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -686,9 +686,9 @@ TEST(SM50_device_binary_or_binary_and_ssrgemm_nn_n, 128x32x8_64x32x1_8x8_8x4_2x1 using WarpShape = cutlass::gemm::GemmShape<64, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -722,9 +722,9 @@ TEST(SM50_device_binary_or_binary_and_ssrgemm_nn_n, 16x32x8_8x16x1_2x2_4x8_2x2) using WarpShape = cutlass::gemm::GemmShape<8, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -758,9 +758,9 @@ 
TEST(SM50_device_binary_or_binary_and_ssrgemm_nn_n, 16x64x8_8x32x1_2x4_4x8_2x2) using WarpShape = cutlass::gemm::GemmShape<8, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -794,9 +794,9 @@ TEST(SM50_device_binary_or_binary_and_ssrgemm_nn_n, 32x32x8_16x16x1_4x2_4x8_2x2) using WarpShape = cutlass::gemm::GemmShape<16, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -830,9 +830,9 @@ TEST(SM50_device_binary_or_binary_and_ssrgemm_nn_n, 32x64x8_16x32x1_4x4_4x8_2x2) using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -866,9 +866,9 @@ 
TEST(SM50_device_binary_or_binary_and_ssrgemm_nn_n, 32x128x8_16x64x1_4x8_4x8_2x2 using WarpShape = cutlass::gemm::GemmShape<16, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -902,9 +902,9 @@ TEST(SM50_device_binary_or_binary_and_ssrgemm_nn_n, 64x32x8_32x16x1_4x4_8x4_2x2) using WarpShape = cutlass::gemm::GemmShape<32, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -938,9 +938,9 @@ TEST(SM50_device_binary_or_binary_and_ssrgemm_nn_n, 64x64x8_32x32x1_8x4_4x8_2x2) using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -974,9 +974,9 @@ 
TEST(SM50_device_binary_or_binary_and_ssrgemm_nn_n, 64x128x8_32x64x1_8x8_4x8_2x2 using WarpShape = cutlass::gemm::GemmShape<32, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1010,9 +1010,9 @@ TEST(SM50_device_binary_or_binary_and_ssrgemm_nn_n, 128x32x8_64x16x1_8x4_8x4_2x2 using WarpShape = cutlass::gemm::GemmShape<64, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1046,9 +1046,9 @@ TEST(SM50_device_binary_or_binary_and_ssrgemm_nn_n, 128x64x8_64x32x1_8x8_8x4_2x2 using WarpShape = cutlass::gemm::GemmShape<64, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1082,9 +1082,9 @@ 
TEST(SM50_device_binary_or_binary_and_ssrgemm_nn_n, 16x64x16_8x16x1_2x2_4x8_2x4) using WarpShape = cutlass::gemm::GemmShape<8, 16, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1118,9 +1118,9 @@ TEST(SM50_device_binary_or_binary_and_ssrgemm_nn_n, 16x128x16_8x32x1_2x4_4x8_2x4 using WarpShape = cutlass::gemm::GemmShape<8, 32, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1154,9 +1154,9 @@ TEST(SM50_device_binary_or_binary_and_ssrgemm_nn_n, 32x32x8_16x8x1_2x2_8x4_2x4) using WarpShape = cutlass::gemm::GemmShape<16, 8, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1190,9 +1190,9 @@ 
TEST(SM50_device_binary_or_binary_and_ssrgemm_nn_n, 32x64x8_16x16x1_4x2_4x8_2x4) using WarpShape = cutlass::gemm::GemmShape<16, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1226,9 +1226,9 @@ TEST(SM50_device_binary_or_binary_and_ssrgemm_nn_n, 32x128x8_16x32x1_4x4_4x8_2x4 using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1262,9 +1262,9 @@ TEST(SM50_device_binary_or_binary_and_ssrgemm_nn_n, 32x256x8_16x64x1_4x8_4x8_2x4 using WarpShape = cutlass::gemm::GemmShape<16, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1298,9 +1298,9 @@ 
TEST(SM50_device_binary_or_binary_and_ssrgemm_nn_n, 64x64x8_32x16x1_4x4_8x4_2x4) using WarpShape = cutlass::gemm::GemmShape<32, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1334,9 +1334,9 @@ TEST(SM50_device_binary_or_binary_and_ssrgemm_nn_n, 64x128x8_32x32x1_8x4_4x8_2x4 using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1370,9 +1370,9 @@ TEST(SM50_device_binary_or_binary_and_ssrgemm_nn_n, 64x256x8_32x64x1_8x8_4x8_2x4 using WarpShape = cutlass::gemm::GemmShape<32, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1406,9 +1406,9 @@ 
TEST(SM50_device_binary_or_binary_and_ssrgemm_nn_n, 128x128x8_64x32x1_8x8_8x4_2x using WarpShape = cutlass::gemm::GemmShape<64, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1442,9 +1442,9 @@ TEST(SM50_device_binary_or_binary_and_ssrgemm_nn_n, 32x32x8_8x16x1_2x2_4x8_4x2) using WarpShape = cutlass::gemm::GemmShape<8, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1478,9 +1478,9 @@ TEST(SM50_device_binary_or_binary_and_ssrgemm_nn_n, 64x32x8_16x16x1_4x2_4x8_4x2) using WarpShape = cutlass::gemm::GemmShape<16, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1514,9 +1514,9 @@ 
TEST(SM50_device_binary_or_binary_and_ssrgemm_nn_n, 64x64x8_16x32x1_4x4_4x8_4x2) using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1550,9 +1550,9 @@ TEST(SM50_device_binary_or_binary_and_ssrgemm_nn_n, 128x32x8_32x16x1_4x4_8x4_4x2 using WarpShape = cutlass::gemm::GemmShape<32, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1586,9 +1586,9 @@ TEST(SM50_device_binary_or_binary_and_ssrgemm_nn_n, 128x64x8_32x32x1_8x4_4x8_4x2 using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1622,9 +1622,9 @@ 
TEST(SM50_device_binary_or_binary_and_ssrgemm_nn_n, 128x128x8_32x64x1_8x8_4x8_4x using WarpShape = cutlass::gemm::GemmShape<32, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1658,9 +1658,9 @@ TEST(SM50_device_binary_or_binary_and_ssrgemm_nn_n, 256x32x8_64x16x1_8x4_8x4_4x2 using WarpShape = cutlass::gemm::GemmShape<64, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1694,9 +1694,9 @@ TEST(SM50_device_binary_or_binary_and_ssrgemm_nn_n, 256x64x8_64x32x1_8x8_8x4_4x2 using WarpShape = cutlass::gemm::GemmShape<64, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1730,9 +1730,9 @@ 
TEST(SM50_device_binary_or_binary_and_ssrgemm_nn_n, 32x64x16_8x16x1_2x2_4x8_4x4) using WarpShape = cutlass::gemm::GemmShape<8, 16, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1766,9 +1766,9 @@ TEST(SM50_device_binary_or_binary_and_ssrgemm_nn_n, 32x128x16_8x32x1_2x4_4x8_4x4 using WarpShape = cutlass::gemm::GemmShape<8, 32, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1802,9 +1802,9 @@ TEST(SM50_device_binary_or_binary_and_ssrgemm_nn_n, 64x32x16_16x8x1_2x2_8x4_4x4) using WarpShape = cutlass::gemm::GemmShape<16, 8, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1838,9 +1838,9 @@ 
TEST(SM50_device_binary_or_binary_and_ssrgemm_nn_n, 64x64x8_16x16x1_4x2_4x8_4x4) using WarpShape = cutlass::gemm::GemmShape<16, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1874,9 +1874,9 @@ TEST(SM50_device_binary_or_binary_and_ssrgemm_nn_n, 64x128x8_16x32x1_4x4_4x8_4x4 using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1910,9 +1910,9 @@ TEST(SM50_device_binary_or_binary_and_ssrgemm_nn_n, 64x256x8_16x64x1_4x8_4x8_4x4 using WarpShape = cutlass::gemm::GemmShape<16, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1946,9 +1946,9 @@ 
TEST(SM50_device_binary_or_binary_and_ssrgemm_nn_n, 128x32x16_32x8x1_4x2_8x4_4x4 using WarpShape = cutlass::gemm::GemmShape<32, 8, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1982,9 +1982,9 @@ TEST(SM50_device_binary_or_binary_and_ssrgemm_nn_n, 128x64x8_32x16x1_4x4_8x4_4x4 using WarpShape = cutlass::gemm::GemmShape<32, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -2018,9 +2018,9 @@ TEST(SM50_device_binary_or_binary_and_ssrgemm_nn_n, 128x128x8_32x32x1_8x4_4x8_4x using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -2054,9 +2054,9 @@ 
TEST(SM50_device_binary_or_binary_and_ssrgemm_nn_n, 256x64x8_64x16x1_8x4_8x4_4x4 using WarpShape = cutlass::gemm::GemmShape<64, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; diff --git a/test/device/sm50_simt_binary_or_binary_and_ssrgemm_nn_t.cu b/test/device/sm50_simt_binary_or_binary_and_ssrgemm_nn_t.cu index 7bededb..624b452 100644 --- a/test/device/sm50_simt_binary_or_binary_and_ssrgemm_nn_t.cu +++ b/test/device/sm50_simt_binary_or_binary_and_ssrgemm_nn_t.cu @@ -38,9 +38,9 @@ TEST(SM50_device_binary_or_binary_and_ssrgemm_nn_t, 8x32x8_8x32x1_2x4_4x8_1x1) { using WarpShape = cutlass::gemm::GemmShape<8, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -74,9 +74,9 @@ TEST(SM50_device_binary_or_binary_and_ssrgemm_nn_t, 16x32x8_16x32x1_4x4_4x8_1x1) using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config 
= typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -110,9 +110,9 @@ TEST(SM50_device_binary_or_binary_and_ssrgemm_nn_t, 16x64x8_16x64x1_4x8_4x8_1x1) using WarpShape = cutlass::gemm::GemmShape<16, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -146,9 +146,9 @@ TEST(SM50_device_binary_or_binary_and_ssrgemm_nn_t, 32x32x8_32x32x1_8x4_4x8_1x1) using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -182,9 +182,9 @@ TEST(SM50_device_binary_or_binary_and_ssrgemm_nn_t, 32x64x8_32x64x1_8x8_4x8_1x1) using WarpShape = cutlass::gemm::GemmShape<32, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename 
cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -218,9 +218,9 @@ TEST(SM50_device_binary_or_binary_and_ssrgemm_nn_t, 64x32x8_64x32x1_8x8_8x4_1x1) using WarpShape = cutlass::gemm::GemmShape<64, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -254,9 +254,9 @@ TEST(SM50_device_binary_or_binary_and_ssrgemm_nn_t, 8x32x8_8x16x1_2x2_4x8_1x2) { using WarpShape = cutlass::gemm::GemmShape<8, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -290,9 +290,9 @@ TEST(SM50_device_binary_or_binary_and_ssrgemm_nn_t, 8x64x8_8x32x1_2x4_4x8_1x2) { using WarpShape = cutlass::gemm::GemmShape<8, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename 
cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -326,9 +326,9 @@ TEST(SM50_device_binary_or_binary_and_ssrgemm_nn_t, 16x32x8_16x16x1_4x2_4x8_1x2) using WarpShape = cutlass::gemm::GemmShape<16, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -362,9 +362,9 @@ TEST(SM50_device_binary_or_binary_and_ssrgemm_nn_t, 16x64x8_16x32x1_4x4_4x8_1x2) using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -398,9 +398,9 @@ TEST(SM50_device_binary_or_binary_and_ssrgemm_nn_t, 16x128x8_16x64x1_4x8_4x8_1x2 using WarpShape = cutlass::gemm::GemmShape<16, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename 
cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -434,9 +434,9 @@ TEST(SM50_device_binary_or_binary_and_ssrgemm_nn_t, 32x32x8_32x16x1_4x4_8x4_1x2) using WarpShape = cutlass::gemm::GemmShape<32, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -470,9 +470,9 @@ TEST(SM50_device_binary_or_binary_and_ssrgemm_nn_t, 32x64x8_32x32x1_8x4_4x8_1x2) using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -506,9 +506,9 @@ TEST(SM50_device_binary_or_binary_and_ssrgemm_nn_t, 32x128x8_32x64x1_8x8_4x8_1x2 using WarpShape = cutlass::gemm::GemmShape<32, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename 
cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -542,9 +542,9 @@ TEST(SM50_device_binary_or_binary_and_ssrgemm_nn_t, 64x64x8_64x32x1_8x8_8x4_1x2) using WarpShape = cutlass::gemm::GemmShape<64, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -578,9 +578,9 @@ TEST(SM50_device_binary_or_binary_and_ssrgemm_nn_t, 32x32x8_16x32x1_4x4_4x8_2x1) using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -614,9 +614,9 @@ TEST(SM50_device_binary_or_binary_and_ssrgemm_nn_t, 64x32x8_32x32x1_8x4_4x8_2x1) using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename 
cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -650,9 +650,9 @@ TEST(SM50_device_binary_or_binary_and_ssrgemm_nn_t, 64x64x8_32x64x1_8x8_4x8_2x1) using WarpShape = cutlass::gemm::GemmShape<32, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -686,9 +686,9 @@ TEST(SM50_device_binary_or_binary_and_ssrgemm_nn_t, 128x32x8_64x32x1_8x8_8x4_2x1 using WarpShape = cutlass::gemm::GemmShape<64, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -722,9 +722,9 @@ TEST(SM50_device_binary_or_binary_and_ssrgemm_nn_t, 16x32x8_8x16x1_2x2_4x8_2x2) using WarpShape = cutlass::gemm::GemmShape<8, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename 
cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -758,9 +758,9 @@ TEST(SM50_device_binary_or_binary_and_ssrgemm_nn_t, 16x64x8_8x32x1_2x4_4x8_2x2) using WarpShape = cutlass::gemm::GemmShape<8, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -794,9 +794,9 @@ TEST(SM50_device_binary_or_binary_and_ssrgemm_nn_t, 32x32x8_16x16x1_4x2_4x8_2x2) using WarpShape = cutlass::gemm::GemmShape<16, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -830,9 +830,9 @@ TEST(SM50_device_binary_or_binary_and_ssrgemm_nn_t, 32x64x8_16x32x1_4x4_4x8_2x2) using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename 
cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -866,9 +866,9 @@ TEST(SM50_device_binary_or_binary_and_ssrgemm_nn_t, 32x128x8_16x64x1_4x8_4x8_2x2 using WarpShape = cutlass::gemm::GemmShape<16, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -902,9 +902,9 @@ TEST(SM50_device_binary_or_binary_and_ssrgemm_nn_t, 64x32x8_32x16x1_4x4_8x4_2x2) using WarpShape = cutlass::gemm::GemmShape<32, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -938,9 +938,9 @@ TEST(SM50_device_binary_or_binary_and_ssrgemm_nn_t, 64x64x8_32x32x1_8x4_4x8_2x2) using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename 
cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -974,9 +974,9 @@ TEST(SM50_device_binary_or_binary_and_ssrgemm_nn_t, 64x128x8_32x64x1_8x8_4x8_2x2 using WarpShape = cutlass::gemm::GemmShape<32, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1010,9 +1010,9 @@ TEST(SM50_device_binary_or_binary_and_ssrgemm_nn_t, 128x32x8_64x16x1_8x4_8x4_2x2 using WarpShape = cutlass::gemm::GemmShape<64, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1046,9 +1046,9 @@ TEST(SM50_device_binary_or_binary_and_ssrgemm_nn_t, 128x64x8_64x32x1_8x8_8x4_2x2 using WarpShape = cutlass::gemm::GemmShape<64, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename 
cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1082,9 +1082,9 @@ TEST(SM50_device_binary_or_binary_and_ssrgemm_nn_t, 16x64x16_8x16x1_2x2_4x8_2x4) using WarpShape = cutlass::gemm::GemmShape<8, 16, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1118,9 +1118,9 @@ TEST(SM50_device_binary_or_binary_and_ssrgemm_nn_t, 16x128x16_8x32x1_2x4_4x8_2x4 using WarpShape = cutlass::gemm::GemmShape<8, 32, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1154,9 +1154,9 @@ TEST(SM50_device_binary_or_binary_and_ssrgemm_nn_t, 32x32x8_16x8x1_2x2_8x4_2x4) using WarpShape = cutlass::gemm::GemmShape<16, 8, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename 
cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1190,9 +1190,9 @@ TEST(SM50_device_binary_or_binary_and_ssrgemm_nn_t, 32x64x8_16x16x1_4x2_4x8_2x4) using WarpShape = cutlass::gemm::GemmShape<16, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1226,9 +1226,9 @@ TEST(SM50_device_binary_or_binary_and_ssrgemm_nn_t, 32x128x8_16x32x1_4x4_4x8_2x4 using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1262,9 +1262,9 @@ TEST(SM50_device_binary_or_binary_and_ssrgemm_nn_t, 32x256x8_16x64x1_4x8_4x8_2x4 using WarpShape = cutlass::gemm::GemmShape<16, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename 
cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1298,9 +1298,9 @@ TEST(SM50_device_binary_or_binary_and_ssrgemm_nn_t, 64x64x8_32x16x1_4x4_8x4_2x4) using WarpShape = cutlass::gemm::GemmShape<32, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1334,9 +1334,9 @@ TEST(SM50_device_binary_or_binary_and_ssrgemm_nn_t, 64x128x8_32x32x1_8x4_4x8_2x4 using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1370,9 +1370,9 @@ TEST(SM50_device_binary_or_binary_and_ssrgemm_nn_t, 64x256x8_32x64x1_8x8_4x8_2x4 using WarpShape = cutlass::gemm::GemmShape<32, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename 
cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1406,9 +1406,9 @@ TEST(SM50_device_binary_or_binary_and_ssrgemm_nn_t, 128x128x8_64x32x1_8x8_8x4_2x using WarpShape = cutlass::gemm::GemmShape<64, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1442,9 +1442,9 @@ TEST(SM50_device_binary_or_binary_and_ssrgemm_nn_t, 32x32x8_8x16x1_2x2_4x8_4x2) using WarpShape = cutlass::gemm::GemmShape<8, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1478,9 +1478,9 @@ TEST(SM50_device_binary_or_binary_and_ssrgemm_nn_t, 64x32x8_16x16x1_4x2_4x8_4x2) using WarpShape = cutlass::gemm::GemmShape<16, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename 
cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1514,9 +1514,9 @@ TEST(SM50_device_binary_or_binary_and_ssrgemm_nn_t, 64x64x8_16x32x1_4x4_4x8_4x2) using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1550,9 +1550,9 @@ TEST(SM50_device_binary_or_binary_and_ssrgemm_nn_t, 128x32x8_32x16x1_4x4_8x4_4x2 using WarpShape = cutlass::gemm::GemmShape<32, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1586,9 +1586,9 @@ TEST(SM50_device_binary_or_binary_and_ssrgemm_nn_t, 128x64x8_32x32x1_8x4_4x8_4x2 using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename 
cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1622,9 +1622,9 @@ TEST(SM50_device_binary_or_binary_and_ssrgemm_nn_t, 128x128x8_32x64x1_8x8_4x8_4x using WarpShape = cutlass::gemm::GemmShape<32, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1658,9 +1658,9 @@ TEST(SM50_device_binary_or_binary_and_ssrgemm_nn_t, 256x32x8_64x16x1_8x4_8x4_4x2 using WarpShape = cutlass::gemm::GemmShape<64, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1694,9 +1694,9 @@ TEST(SM50_device_binary_or_binary_and_ssrgemm_nn_t, 256x64x8_64x32x1_8x8_8x4_4x2 using WarpShape = cutlass::gemm::GemmShape<64, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename 
cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1730,9 +1730,9 @@ TEST(SM50_device_binary_or_binary_and_ssrgemm_nn_t, 32x64x16_8x16x1_2x2_4x8_4x4) using WarpShape = cutlass::gemm::GemmShape<8, 16, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1766,9 +1766,9 @@ TEST(SM50_device_binary_or_binary_and_ssrgemm_nn_t, 32x128x16_8x32x1_2x4_4x8_4x4 using WarpShape = cutlass::gemm::GemmShape<8, 32, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1802,9 +1802,9 @@ TEST(SM50_device_binary_or_binary_and_ssrgemm_nn_t, 64x32x16_16x8x1_2x2_8x4_4x4) using WarpShape = cutlass::gemm::GemmShape<16, 8, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename 
cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1838,9 +1838,9 @@ TEST(SM50_device_binary_or_binary_and_ssrgemm_nn_t, 64x64x8_16x16x1_4x2_4x8_4x4) using WarpShape = cutlass::gemm::GemmShape<16, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1874,9 +1874,9 @@ TEST(SM50_device_binary_or_binary_and_ssrgemm_nn_t, 64x128x8_16x32x1_4x4_4x8_4x4 using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1910,9 +1910,9 @@ TEST(SM50_device_binary_or_binary_and_ssrgemm_nn_t, 64x256x8_16x64x1_4x8_4x8_4x4 using WarpShape = cutlass::gemm::GemmShape<16, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename 
cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1946,9 +1946,9 @@ TEST(SM50_device_binary_or_binary_and_ssrgemm_nn_t, 128x32x16_32x8x1_4x2_8x4_4x4 using WarpShape = cutlass::gemm::GemmShape<32, 8, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1982,9 +1982,9 @@ TEST(SM50_device_binary_or_binary_and_ssrgemm_nn_t, 128x64x8_32x16x1_4x4_8x4_4x4 using WarpShape = cutlass::gemm::GemmShape<32, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -2018,9 +2018,9 @@ TEST(SM50_device_binary_or_binary_and_ssrgemm_nn_t, 128x128x8_32x32x1_8x4_4x8_4x using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename 
cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -2054,9 +2054,9 @@ TEST(SM50_device_binary_or_binary_and_ssrgemm_nn_t, 256x64x8_64x16x1_8x4_8x4_4x4 using WarpShape = cutlass::gemm::GemmShape<64, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; diff --git a/test/device/sm50_simt_binary_or_binary_and_ssrgemm_nt_n.cu b/test/device/sm50_simt_binary_or_binary_and_ssrgemm_nt_n.cu index 102a7e1..102a4a2 100644 --- a/test/device/sm50_simt_binary_or_binary_and_ssrgemm_nt_n.cu +++ b/test/device/sm50_simt_binary_or_binary_and_ssrgemm_nt_n.cu @@ -38,9 +38,9 @@ TEST(SM50_device_binary_or_binary_and_ssrgemm_nt_n, 8x32x8_8x32x1_2x4_4x8_1x1) { using WarpShape = cutlass::gemm::GemmShape<8, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -74,9 +74,9 @@ TEST(SM50_device_binary_or_binary_and_ssrgemm_nt_n, 16x32x8_16x32x1_4x4_4x8_1x1) using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using 
InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -110,9 +110,9 @@ TEST(SM50_device_binary_or_binary_and_ssrgemm_nt_n, 16x64x8_16x64x1_4x8_4x8_1x1) using WarpShape = cutlass::gemm::GemmShape<16, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -146,9 +146,9 @@ TEST(SM50_device_binary_or_binary_and_ssrgemm_nt_n, 32x32x8_32x32x1_8x4_4x8_1x1) using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -182,9 +182,9 @@ TEST(SM50_device_binary_or_binary_and_ssrgemm_nt_n, 32x64x8_32x64x1_8x8_4x8_1x1) using WarpShape = cutlass::gemm::GemmShape<32, 64, 8>; using InstructionShape = 
cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -218,9 +218,9 @@ TEST(SM50_device_binary_or_binary_and_ssrgemm_nt_n, 64x32x8_64x32x1_8x8_8x4_1x1) using WarpShape = cutlass::gemm::GemmShape<64, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -254,9 +254,9 @@ TEST(SM50_device_binary_or_binary_and_ssrgemm_nt_n, 8x32x8_8x16x1_2x2_4x8_1x2) { using WarpShape = cutlass::gemm::GemmShape<8, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -290,9 +290,9 @@ TEST(SM50_device_binary_or_binary_and_ssrgemm_nt_n, 8x64x8_8x32x1_2x4_4x8_1x2) { using WarpShape = cutlass::gemm::GemmShape<8, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 
1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -326,9 +326,9 @@ TEST(SM50_device_binary_or_binary_and_ssrgemm_nt_n, 16x32x8_16x16x1_4x2_4x8_1x2) using WarpShape = cutlass::gemm::GemmShape<16, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -362,9 +362,9 @@ TEST(SM50_device_binary_or_binary_and_ssrgemm_nt_n, 16x64x8_16x32x1_4x4_4x8_1x2) using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -398,9 +398,9 @@ TEST(SM50_device_binary_or_binary_and_ssrgemm_nt_n, 16x128x8_16x64x1_4x8_4x8_1x2 using WarpShape = cutlass::gemm::GemmShape<16, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = 
typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -434,9 +434,9 @@ TEST(SM50_device_binary_or_binary_and_ssrgemm_nt_n, 32x32x8_32x16x1_4x4_8x4_1x2) using WarpShape = cutlass::gemm::GemmShape<32, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -470,9 +470,9 @@ TEST(SM50_device_binary_or_binary_and_ssrgemm_nt_n, 32x64x8_32x32x1_8x4_4x8_1x2) using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -506,9 +506,9 @@ TEST(SM50_device_binary_or_binary_and_ssrgemm_nt_n, 32x128x8_32x64x1_8x8_4x8_1x2 using WarpShape = cutlass::gemm::GemmShape<32, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename 
cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -542,9 +542,9 @@ TEST(SM50_device_binary_or_binary_and_ssrgemm_nt_n, 64x64x8_64x32x1_8x8_8x4_1x2) using WarpShape = cutlass::gemm::GemmShape<64, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -578,9 +578,9 @@ TEST(SM50_device_binary_or_binary_and_ssrgemm_nt_n, 32x32x8_16x32x1_4x4_4x8_2x1) using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -614,9 +614,9 @@ TEST(SM50_device_binary_or_binary_and_ssrgemm_nt_n, 64x32x8_32x32x1_8x4_4x8_2x1) using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename 
cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -650,9 +650,9 @@ TEST(SM50_device_binary_or_binary_and_ssrgemm_nt_n, 64x64x8_32x64x1_8x8_4x8_2x1) using WarpShape = cutlass::gemm::GemmShape<32, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -686,9 +686,9 @@ TEST(SM50_device_binary_or_binary_and_ssrgemm_nt_n, 128x32x8_64x32x1_8x8_8x4_2x1 using WarpShape = cutlass::gemm::GemmShape<64, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -722,9 +722,9 @@ TEST(SM50_device_binary_or_binary_and_ssrgemm_nt_n, 16x32x8_8x16x1_2x2_4x8_2x2) using WarpShape = cutlass::gemm::GemmShape<8, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename 
cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -758,9 +758,9 @@ TEST(SM50_device_binary_or_binary_and_ssrgemm_nt_n, 16x64x8_8x32x1_2x4_4x8_2x2) using WarpShape = cutlass::gemm::GemmShape<8, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -794,9 +794,9 @@ TEST(SM50_device_binary_or_binary_and_ssrgemm_nt_n, 32x32x8_16x16x1_4x2_4x8_2x2) using WarpShape = cutlass::gemm::GemmShape<16, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -830,9 +830,9 @@ TEST(SM50_device_binary_or_binary_and_ssrgemm_nt_n, 32x64x8_16x32x1_4x4_4x8_2x2) using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename 
cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -866,9 +866,9 @@ TEST(SM50_device_binary_or_binary_and_ssrgemm_nt_n, 32x128x8_16x64x1_4x8_4x8_2x2 using WarpShape = cutlass::gemm::GemmShape<16, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -902,9 +902,9 @@ TEST(SM50_device_binary_or_binary_and_ssrgemm_nt_n, 64x32x8_32x16x1_4x4_8x4_2x2) using WarpShape = cutlass::gemm::GemmShape<32, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -938,9 +938,9 @@ TEST(SM50_device_binary_or_binary_and_ssrgemm_nt_n, 64x64x8_32x32x1_8x4_4x8_2x2) using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename 
cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -974,9 +974,9 @@ TEST(SM50_device_binary_or_binary_and_ssrgemm_nt_n, 64x128x8_32x64x1_8x8_4x8_2x2 using WarpShape = cutlass::gemm::GemmShape<32, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1010,9 +1010,9 @@ TEST(SM50_device_binary_or_binary_and_ssrgemm_nt_n, 128x32x8_64x16x1_8x4_8x4_2x2 using WarpShape = cutlass::gemm::GemmShape<64, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1046,9 +1046,9 @@ TEST(SM50_device_binary_or_binary_and_ssrgemm_nt_n, 128x64x8_64x32x1_8x8_8x4_2x2 using WarpShape = cutlass::gemm::GemmShape<64, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename 
cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1082,9 +1082,9 @@ TEST(SM50_device_binary_or_binary_and_ssrgemm_nt_n, 16x64x16_8x16x1_2x2_4x8_2x4) using WarpShape = cutlass::gemm::GemmShape<8, 16, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1118,9 +1118,9 @@ TEST(SM50_device_binary_or_binary_and_ssrgemm_nt_n, 16x128x16_8x32x1_2x4_4x8_2x4 using WarpShape = cutlass::gemm::GemmShape<8, 32, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1154,9 +1154,9 @@ TEST(SM50_device_binary_or_binary_and_ssrgemm_nt_n, 32x32x8_16x8x1_2x2_8x4_2x4) using WarpShape = cutlass::gemm::GemmShape<16, 8, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename 
cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1190,9 +1190,9 @@ TEST(SM50_device_binary_or_binary_and_ssrgemm_nt_n, 32x64x8_16x16x1_4x2_4x8_2x4) using WarpShape = cutlass::gemm::GemmShape<16, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1226,9 +1226,9 @@ TEST(SM50_device_binary_or_binary_and_ssrgemm_nt_n, 32x128x8_16x32x1_4x4_4x8_2x4 using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1262,9 +1262,9 @@ TEST(SM50_device_binary_or_binary_and_ssrgemm_nt_n, 32x256x8_16x64x1_4x8_4x8_2x4 using WarpShape = cutlass::gemm::GemmShape<16, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename 
cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1298,9 +1298,9 @@ TEST(SM50_device_binary_or_binary_and_ssrgemm_nt_n, 64x64x8_32x16x1_4x4_8x4_2x4) using WarpShape = cutlass::gemm::GemmShape<32, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1334,9 +1334,9 @@ TEST(SM50_device_binary_or_binary_and_ssrgemm_nt_n, 64x128x8_32x32x1_8x4_4x8_2x4 using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1370,9 +1370,9 @@ TEST(SM50_device_binary_or_binary_and_ssrgemm_nt_n, 64x256x8_32x64x1_8x8_4x8_2x4 using WarpShape = cutlass::gemm::GemmShape<32, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename 
cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1406,9 +1406,9 @@ TEST(SM50_device_binary_or_binary_and_ssrgemm_nt_n, 128x128x8_64x32x1_8x8_8x4_2x using WarpShape = cutlass::gemm::GemmShape<64, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1442,9 +1442,9 @@ TEST(SM50_device_binary_or_binary_and_ssrgemm_nt_n, 32x32x8_8x16x1_2x2_4x8_4x2) using WarpShape = cutlass::gemm::GemmShape<8, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1478,9 +1478,9 @@ TEST(SM50_device_binary_or_binary_and_ssrgemm_nt_n, 64x32x8_16x16x1_4x2_4x8_4x2) using WarpShape = cutlass::gemm::GemmShape<16, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename 
cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1514,9 +1514,9 @@ TEST(SM50_device_binary_or_binary_and_ssrgemm_nt_n, 64x64x8_16x32x1_4x4_4x8_4x2) using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1550,9 +1550,9 @@ TEST(SM50_device_binary_or_binary_and_ssrgemm_nt_n, 128x32x8_32x16x1_4x4_8x4_4x2 using WarpShape = cutlass::gemm::GemmShape<32, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1586,9 +1586,9 @@ TEST(SM50_device_binary_or_binary_and_ssrgemm_nt_n, 128x64x8_32x32x1_8x4_4x8_4x2 using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename 
cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1622,9 +1622,9 @@ TEST(SM50_device_binary_or_binary_and_ssrgemm_nt_n, 128x128x8_32x64x1_8x8_4x8_4x using WarpShape = cutlass::gemm::GemmShape<32, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1658,9 +1658,9 @@ TEST(SM50_device_binary_or_binary_and_ssrgemm_nt_n, 256x32x8_64x16x1_8x4_8x4_4x2 using WarpShape = cutlass::gemm::GemmShape<64, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1694,9 +1694,9 @@ TEST(SM50_device_binary_or_binary_and_ssrgemm_nt_n, 256x64x8_64x32x1_8x8_8x4_4x2 using WarpShape = cutlass::gemm::GemmShape<64, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename 
cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1730,9 +1730,9 @@ TEST(SM50_device_binary_or_binary_and_ssrgemm_nt_n, 32x64x16_8x16x1_2x2_4x8_4x4) using WarpShape = cutlass::gemm::GemmShape<8, 16, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1766,9 +1766,9 @@ TEST(SM50_device_binary_or_binary_and_ssrgemm_nt_n, 32x128x16_8x32x1_2x4_4x8_4x4 using WarpShape = cutlass::gemm::GemmShape<8, 32, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1802,9 +1802,9 @@ TEST(SM50_device_binary_or_binary_and_ssrgemm_nt_n, 64x32x16_16x8x1_2x2_8x4_4x4) using WarpShape = cutlass::gemm::GemmShape<16, 8, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename 
cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1838,9 +1838,9 @@ TEST(SM50_device_binary_or_binary_and_ssrgemm_nt_n, 64x64x8_16x16x1_4x2_4x8_4x4) using WarpShape = cutlass::gemm::GemmShape<16, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1874,9 +1874,9 @@ TEST(SM50_device_binary_or_binary_and_ssrgemm_nt_n, 64x128x8_16x32x1_4x4_4x8_4x4 using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1910,9 +1910,9 @@ TEST(SM50_device_binary_or_binary_and_ssrgemm_nt_n, 64x256x8_16x64x1_4x8_4x8_4x4 using WarpShape = cutlass::gemm::GemmShape<16, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename 
cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1946,9 +1946,9 @@ TEST(SM50_device_binary_or_binary_and_ssrgemm_nt_n, 128x32x16_32x8x1_4x2_8x4_4x4 using WarpShape = cutlass::gemm::GemmShape<32, 8, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1982,9 +1982,9 @@ TEST(SM50_device_binary_or_binary_and_ssrgemm_nt_n, 128x64x8_32x16x1_4x4_8x4_4x4 using WarpShape = cutlass::gemm::GemmShape<32, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -2018,9 +2018,9 @@ TEST(SM50_device_binary_or_binary_and_ssrgemm_nt_n, 128x128x8_32x32x1_8x4_4x8_4x using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename 
cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -2054,9 +2054,9 @@ TEST(SM50_device_binary_or_binary_and_ssrgemm_nt_n, 256x64x8_64x16x1_8x4_8x4_4x4 using WarpShape = cutlass::gemm::GemmShape<64, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; diff --git a/test/device/sm50_simt_binary_or_binary_and_ssrgemm_nt_t.cu b/test/device/sm50_simt_binary_or_binary_and_ssrgemm_nt_t.cu index ae6fafe..86a75a5 100644 --- a/test/device/sm50_simt_binary_or_binary_and_ssrgemm_nt_t.cu +++ b/test/device/sm50_simt_binary_or_binary_and_ssrgemm_nt_t.cu @@ -38,9 +38,9 @@ TEST(SM50_device_binary_or_binary_and_ssrgemm_nt_t, 8x32x8_8x32x1_2x4_4x8_1x1) { using WarpShape = cutlass::gemm::GemmShape<8, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = 
Config::MultiplicationOp; @@ -74,9 +74,9 @@ TEST(SM50_device_binary_or_binary_and_ssrgemm_nt_t, 16x32x8_16x32x1_4x4_4x8_1x1) using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -110,9 +110,9 @@ TEST(SM50_device_binary_or_binary_and_ssrgemm_nt_t, 16x64x8_16x64x1_4x8_4x8_1x1) using WarpShape = cutlass::gemm::GemmShape<16, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -146,9 +146,9 @@ TEST(SM50_device_binary_or_binary_and_ssrgemm_nt_t, 32x32x8_32x32x1_8x4_4x8_1x1) using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ 
-182,9 +182,9 @@ TEST(SM50_device_binary_or_binary_and_ssrgemm_nt_t, 32x64x8_32x64x1_8x8_4x8_1x1) using WarpShape = cutlass::gemm::GemmShape<32, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -218,9 +218,9 @@ TEST(SM50_device_binary_or_binary_and_ssrgemm_nt_t, 64x32x8_64x32x1_8x8_8x4_1x1) using WarpShape = cutlass::gemm::GemmShape<64, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -254,9 +254,9 @@ TEST(SM50_device_binary_or_binary_and_ssrgemm_nt_t, 8x32x8_8x16x1_2x2_4x8_1x2) { using WarpShape = cutlass::gemm::GemmShape<8, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -290,9 +290,9 @@ 
TEST(SM50_device_binary_or_binary_and_ssrgemm_nt_t, 8x64x8_8x32x1_2x4_4x8_1x2) { using WarpShape = cutlass::gemm::GemmShape<8, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -326,9 +326,9 @@ TEST(SM50_device_binary_or_binary_and_ssrgemm_nt_t, 16x32x8_16x16x1_4x2_4x8_1x2) using WarpShape = cutlass::gemm::GemmShape<16, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -362,9 +362,9 @@ TEST(SM50_device_binary_or_binary_and_ssrgemm_nt_t, 16x64x8_16x32x1_4x4_4x8_1x2) using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -398,9 +398,9 @@ 
TEST(SM50_device_binary_or_binary_and_ssrgemm_nt_t, 16x128x8_16x64x1_4x8_4x8_1x2 using WarpShape = cutlass::gemm::GemmShape<16, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -434,9 +434,9 @@ TEST(SM50_device_binary_or_binary_and_ssrgemm_nt_t, 32x32x8_32x16x1_4x4_8x4_1x2) using WarpShape = cutlass::gemm::GemmShape<32, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -470,9 +470,9 @@ TEST(SM50_device_binary_or_binary_and_ssrgemm_nt_t, 32x64x8_32x32x1_8x4_4x8_1x2) using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -506,9 +506,9 @@ 
TEST(SM50_device_binary_or_binary_and_ssrgemm_nt_t, 32x128x8_32x64x1_8x8_4x8_1x2 using WarpShape = cutlass::gemm::GemmShape<32, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -542,9 +542,9 @@ TEST(SM50_device_binary_or_binary_and_ssrgemm_nt_t, 64x64x8_64x32x1_8x8_8x4_1x2) using WarpShape = cutlass::gemm::GemmShape<64, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -578,9 +578,9 @@ TEST(SM50_device_binary_or_binary_and_ssrgemm_nt_t, 32x32x8_16x32x1_4x4_4x8_2x1) using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -614,9 +614,9 @@ 
TEST(SM50_device_binary_or_binary_and_ssrgemm_nt_t, 64x32x8_32x32x1_8x4_4x8_2x1) using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -650,9 +650,9 @@ TEST(SM50_device_binary_or_binary_and_ssrgemm_nt_t, 64x64x8_32x64x1_8x8_4x8_2x1) using WarpShape = cutlass::gemm::GemmShape<32, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -686,9 +686,9 @@ TEST(SM50_device_binary_or_binary_and_ssrgemm_nt_t, 128x32x8_64x32x1_8x8_8x4_2x1 using WarpShape = cutlass::gemm::GemmShape<64, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -722,9 +722,9 @@ 
TEST(SM50_device_binary_or_binary_and_ssrgemm_nt_t, 16x32x8_8x16x1_2x2_4x8_2x2) using WarpShape = cutlass::gemm::GemmShape<8, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -758,9 +758,9 @@ TEST(SM50_device_binary_or_binary_and_ssrgemm_nt_t, 16x64x8_8x32x1_2x4_4x8_2x2) using WarpShape = cutlass::gemm::GemmShape<8, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -794,9 +794,9 @@ TEST(SM50_device_binary_or_binary_and_ssrgemm_nt_t, 32x32x8_16x16x1_4x2_4x8_2x2) using WarpShape = cutlass::gemm::GemmShape<16, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -830,9 +830,9 @@ 
TEST(SM50_device_binary_or_binary_and_ssrgemm_nt_t, 32x64x8_16x32x1_4x4_4x8_2x2) using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -866,9 +866,9 @@ TEST(SM50_device_binary_or_binary_and_ssrgemm_nt_t, 32x128x8_16x64x1_4x8_4x8_2x2 using WarpShape = cutlass::gemm::GemmShape<16, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -902,9 +902,9 @@ TEST(SM50_device_binary_or_binary_and_ssrgemm_nt_t, 64x32x8_32x16x1_4x4_8x4_2x2) using WarpShape = cutlass::gemm::GemmShape<32, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -938,9 +938,9 @@ 
TEST(SM50_device_binary_or_binary_and_ssrgemm_nt_t, 64x64x8_32x32x1_8x4_4x8_2x2) using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -974,9 +974,9 @@ TEST(SM50_device_binary_or_binary_and_ssrgemm_nt_t, 64x128x8_32x64x1_8x8_4x8_2x2 using WarpShape = cutlass::gemm::GemmShape<32, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1010,9 +1010,9 @@ TEST(SM50_device_binary_or_binary_and_ssrgemm_nt_t, 128x32x8_64x16x1_8x4_8x4_2x2 using WarpShape = cutlass::gemm::GemmShape<64, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1046,9 +1046,9 @@ 
TEST(SM50_device_binary_or_binary_and_ssrgemm_nt_t, 128x64x8_64x32x1_8x8_8x4_2x2 using WarpShape = cutlass::gemm::GemmShape<64, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1082,9 +1082,9 @@ TEST(SM50_device_binary_or_binary_and_ssrgemm_nt_t, 16x64x16_8x16x1_2x2_4x8_2x4) using WarpShape = cutlass::gemm::GemmShape<8, 16, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1118,9 +1118,9 @@ TEST(SM50_device_binary_or_binary_and_ssrgemm_nt_t, 16x128x16_8x32x1_2x4_4x8_2x4 using WarpShape = cutlass::gemm::GemmShape<8, 32, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1154,9 +1154,9 @@ 
TEST(SM50_device_binary_or_binary_and_ssrgemm_nt_t, 32x32x8_16x8x1_2x2_8x4_2x4) using WarpShape = cutlass::gemm::GemmShape<16, 8, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1190,9 +1190,9 @@ TEST(SM50_device_binary_or_binary_and_ssrgemm_nt_t, 32x64x8_16x16x1_4x2_4x8_2x4) using WarpShape = cutlass::gemm::GemmShape<16, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1226,9 +1226,9 @@ TEST(SM50_device_binary_or_binary_and_ssrgemm_nt_t, 32x128x8_16x32x1_4x4_4x8_2x4 using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1262,9 +1262,9 @@ 
TEST(SM50_device_binary_or_binary_and_ssrgemm_nt_t, 32x256x8_16x64x1_4x8_4x8_2x4 using WarpShape = cutlass::gemm::GemmShape<16, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1298,9 +1298,9 @@ TEST(SM50_device_binary_or_binary_and_ssrgemm_nt_t, 64x64x8_32x16x1_4x4_8x4_2x4) using WarpShape = cutlass::gemm::GemmShape<32, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1334,9 +1334,9 @@ TEST(SM50_device_binary_or_binary_and_ssrgemm_nt_t, 64x128x8_32x32x1_8x4_4x8_2x4 using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1370,9 +1370,9 @@ 
TEST(SM50_device_binary_or_binary_and_ssrgemm_nt_t, 64x256x8_32x64x1_8x8_4x8_2x4 using WarpShape = cutlass::gemm::GemmShape<32, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1406,9 +1406,9 @@ TEST(SM50_device_binary_or_binary_and_ssrgemm_nt_t, 128x128x8_64x32x1_8x8_8x4_2x using WarpShape = cutlass::gemm::GemmShape<64, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1442,9 +1442,9 @@ TEST(SM50_device_binary_or_binary_and_ssrgemm_nt_t, 32x32x8_8x16x1_2x2_4x8_4x2) using WarpShape = cutlass::gemm::GemmShape<8, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1478,9 +1478,9 @@ 
TEST(SM50_device_binary_or_binary_and_ssrgemm_nt_t, 64x32x8_16x16x1_4x2_4x8_4x2) using WarpShape = cutlass::gemm::GemmShape<16, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1514,9 +1514,9 @@ TEST(SM50_device_binary_or_binary_and_ssrgemm_nt_t, 64x64x8_16x32x1_4x4_4x8_4x2) using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1550,9 +1550,9 @@ TEST(SM50_device_binary_or_binary_and_ssrgemm_nt_t, 128x32x8_32x16x1_4x4_8x4_4x2 using WarpShape = cutlass::gemm::GemmShape<32, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1586,9 +1586,9 @@ 
TEST(SM50_device_binary_or_binary_and_ssrgemm_nt_t, 128x64x8_32x32x1_8x4_4x8_4x2 using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1622,9 +1622,9 @@ TEST(SM50_device_binary_or_binary_and_ssrgemm_nt_t, 128x128x8_32x64x1_8x8_4x8_4x using WarpShape = cutlass::gemm::GemmShape<32, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1658,9 +1658,9 @@ TEST(SM50_device_binary_or_binary_and_ssrgemm_nt_t, 256x32x8_64x16x1_8x4_8x4_4x2 using WarpShape = cutlass::gemm::GemmShape<64, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1694,9 +1694,9 @@ 
TEST(SM50_device_binary_or_binary_and_ssrgemm_nt_t, 256x64x8_64x32x1_8x8_8x4_4x2 using WarpShape = cutlass::gemm::GemmShape<64, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1730,9 +1730,9 @@ TEST(SM50_device_binary_or_binary_and_ssrgemm_nt_t, 32x64x16_8x16x1_2x2_4x8_4x4) using WarpShape = cutlass::gemm::GemmShape<8, 16, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1766,9 +1766,9 @@ TEST(SM50_device_binary_or_binary_and_ssrgemm_nt_t, 32x128x16_8x32x1_2x4_4x8_4x4 using WarpShape = cutlass::gemm::GemmShape<8, 32, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1802,9 +1802,9 @@ 
TEST(SM50_device_binary_or_binary_and_ssrgemm_nt_t, 64x32x16_16x8x1_2x2_8x4_4x4) using WarpShape = cutlass::gemm::GemmShape<16, 8, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1838,9 +1838,9 @@ TEST(SM50_device_binary_or_binary_and_ssrgemm_nt_t, 64x64x8_16x16x1_4x2_4x8_4x4) using WarpShape = cutlass::gemm::GemmShape<16, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1874,9 +1874,9 @@ TEST(SM50_device_binary_or_binary_and_ssrgemm_nt_t, 64x128x8_16x32x1_4x4_4x8_4x4 using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1910,9 +1910,9 @@ 
TEST(SM50_device_binary_or_binary_and_ssrgemm_nt_t, 64x256x8_16x64x1_4x8_4x8_4x4 using WarpShape = cutlass::gemm::GemmShape<16, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1946,9 +1946,9 @@ TEST(SM50_device_binary_or_binary_and_ssrgemm_nt_t, 128x32x16_32x8x1_4x2_8x4_4x4 using WarpShape = cutlass::gemm::GemmShape<32, 8, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1982,9 +1982,9 @@ TEST(SM50_device_binary_or_binary_and_ssrgemm_nt_t, 128x64x8_32x16x1_4x4_8x4_4x4 using WarpShape = cutlass::gemm::GemmShape<32, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -2018,9 +2018,9 @@ 
TEST(SM50_device_binary_or_binary_and_ssrgemm_nt_t, 128x128x8_32x32x1_8x4_4x8_4x using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -2054,9 +2054,9 @@ TEST(SM50_device_binary_or_binary_and_ssrgemm_nt_t, 256x64x8_64x16x1_8x4_8x4_4x4 using WarpShape = cutlass::gemm::GemmShape<64, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; diff --git a/test/device/sm50_simt_binary_or_binary_and_ssrgemm_tn_n.cu b/test/device/sm50_simt_binary_or_binary_and_ssrgemm_tn_n.cu index f2a06a6..0be75ca 100644 --- a/test/device/sm50_simt_binary_or_binary_and_ssrgemm_tn_n.cu +++ b/test/device/sm50_simt_binary_or_binary_and_ssrgemm_tn_n.cu @@ -38,9 +38,9 @@ TEST(SM50_device_binary_or_binary_and_ssrgemm_tn_n, 8x32x8_8x32x1_2x4_4x8_1x1) { using WarpShape = cutlass::gemm::GemmShape<8, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using 
Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -74,9 +74,9 @@ TEST(SM50_device_binary_or_binary_and_ssrgemm_tn_n, 16x32x8_16x32x1_4x4_4x8_1x1) using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -110,9 +110,9 @@ TEST(SM50_device_binary_or_binary_and_ssrgemm_tn_n, 16x64x8_16x64x1_4x8_4x8_1x1) using WarpShape = cutlass::gemm::GemmShape<16, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -146,9 +146,9 @@ TEST(SM50_device_binary_or_binary_and_ssrgemm_tn_n, 32x32x8_32x32x1_8x4_4x8_1x1) using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename 
cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -182,9 +182,9 @@ TEST(SM50_device_binary_or_binary_and_ssrgemm_tn_n, 32x64x8_32x64x1_8x8_4x8_1x1) using WarpShape = cutlass::gemm::GemmShape<32, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -218,9 +218,9 @@ TEST(SM50_device_binary_or_binary_and_ssrgemm_tn_n, 64x32x8_64x32x1_8x8_8x4_1x1) using WarpShape = cutlass::gemm::GemmShape<64, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -254,9 +254,9 @@ TEST(SM50_device_binary_or_binary_and_ssrgemm_tn_n, 8x32x8_8x16x1_2x2_4x8_1x2) { using WarpShape = cutlass::gemm::GemmShape<8, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename 
cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -290,9 +290,9 @@ TEST(SM50_device_binary_or_binary_and_ssrgemm_tn_n, 8x64x8_8x32x1_2x4_4x8_1x2) { using WarpShape = cutlass::gemm::GemmShape<8, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -326,9 +326,9 @@ TEST(SM50_device_binary_or_binary_and_ssrgemm_tn_n, 16x32x8_16x16x1_4x2_4x8_1x2) using WarpShape = cutlass::gemm::GemmShape<16, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -362,9 +362,9 @@ TEST(SM50_device_binary_or_binary_and_ssrgemm_tn_n, 16x64x8_16x32x1_4x4_4x8_1x2) using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename 
cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -398,9 +398,9 @@ TEST(SM50_device_binary_or_binary_and_ssrgemm_tn_n, 16x128x8_16x64x1_4x8_4x8_1x2 using WarpShape = cutlass::gemm::GemmShape<16, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -434,9 +434,9 @@ TEST(SM50_device_binary_or_binary_and_ssrgemm_tn_n, 32x32x8_32x16x1_4x4_8x4_1x2) using WarpShape = cutlass::gemm::GemmShape<32, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -470,9 +470,9 @@ TEST(SM50_device_binary_or_binary_and_ssrgemm_tn_n, 32x64x8_32x32x1_8x4_4x8_1x2) using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename 
cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -506,9 +506,9 @@ TEST(SM50_device_binary_or_binary_and_ssrgemm_tn_n, 32x128x8_32x64x1_8x8_4x8_1x2 using WarpShape = cutlass::gemm::GemmShape<32, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -542,9 +542,9 @@ TEST(SM50_device_binary_or_binary_and_ssrgemm_tn_n, 64x64x8_64x32x1_8x8_8x4_1x2) using WarpShape = cutlass::gemm::GemmShape<64, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -578,9 +578,9 @@ TEST(SM50_device_binary_or_binary_and_ssrgemm_tn_n, 32x32x8_16x32x1_4x4_4x8_2x1) using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename 
cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -614,9 +614,9 @@ TEST(SM50_device_binary_or_binary_and_ssrgemm_tn_n, 64x32x8_32x32x1_8x4_4x8_2x1) using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -650,9 +650,9 @@ TEST(SM50_device_binary_or_binary_and_ssrgemm_tn_n, 64x64x8_32x64x1_8x8_4x8_2x1) using WarpShape = cutlass::gemm::GemmShape<32, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -686,9 +686,9 @@ TEST(SM50_device_binary_or_binary_and_ssrgemm_tn_n, 128x32x8_64x32x1_8x8_8x4_2x1 using WarpShape = cutlass::gemm::GemmShape<64, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename 
cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -722,9 +722,9 @@ TEST(SM50_device_binary_or_binary_and_ssrgemm_tn_n, 16x32x8_8x16x1_2x2_4x8_2x2) using WarpShape = cutlass::gemm::GemmShape<8, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -758,9 +758,9 @@ TEST(SM50_device_binary_or_binary_and_ssrgemm_tn_n, 16x64x8_8x32x1_2x4_4x8_2x2) using WarpShape = cutlass::gemm::GemmShape<8, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -794,9 +794,9 @@ TEST(SM50_device_binary_or_binary_and_ssrgemm_tn_n, 32x32x8_16x16x1_4x2_4x8_2x2) using WarpShape = cutlass::gemm::GemmShape<16, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename 
cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -830,9 +830,9 @@ TEST(SM50_device_binary_or_binary_and_ssrgemm_tn_n, 32x64x8_16x32x1_4x4_4x8_2x2) using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -866,9 +866,9 @@ TEST(SM50_device_binary_or_binary_and_ssrgemm_tn_n, 32x128x8_16x64x1_4x8_4x8_2x2 using WarpShape = cutlass::gemm::GemmShape<16, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -902,9 +902,9 @@ TEST(SM50_device_binary_or_binary_and_ssrgemm_tn_n, 64x32x8_32x16x1_4x4_8x4_2x2) using WarpShape = cutlass::gemm::GemmShape<32, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename 
cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -938,9 +938,9 @@ TEST(SM50_device_binary_or_binary_and_ssrgemm_tn_n, 64x64x8_32x32x1_8x4_4x8_2x2) using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -974,9 +974,9 @@ TEST(SM50_device_binary_or_binary_and_ssrgemm_tn_n, 64x128x8_32x64x1_8x8_4x8_2x2 using WarpShape = cutlass::gemm::GemmShape<32, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1010,9 +1010,9 @@ TEST(SM50_device_binary_or_binary_and_ssrgemm_tn_n, 128x32x8_64x16x1_8x4_8x4_2x2 using WarpShape = cutlass::gemm::GemmShape<64, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename 
cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1046,9 +1046,9 @@ TEST(SM50_device_binary_or_binary_and_ssrgemm_tn_n, 128x64x8_64x32x1_8x8_8x4_2x2 using WarpShape = cutlass::gemm::GemmShape<64, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1082,9 +1082,9 @@ TEST(SM50_device_binary_or_binary_and_ssrgemm_tn_n, 16x64x16_8x16x1_2x2_4x8_2x4) using WarpShape = cutlass::gemm::GemmShape<8, 16, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1118,9 +1118,9 @@ TEST(SM50_device_binary_or_binary_and_ssrgemm_tn_n, 16x128x16_8x32x1_2x4_4x8_2x4 using WarpShape = cutlass::gemm::GemmShape<8, 32, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename 
cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1154,9 +1154,9 @@ TEST(SM50_device_binary_or_binary_and_ssrgemm_tn_n, 32x32x8_16x8x1_2x2_8x4_2x4) using WarpShape = cutlass::gemm::GemmShape<16, 8, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1190,9 +1190,9 @@ TEST(SM50_device_binary_or_binary_and_ssrgemm_tn_n, 32x64x8_16x16x1_4x2_4x8_2x4) using WarpShape = cutlass::gemm::GemmShape<16, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1226,9 +1226,9 @@ TEST(SM50_device_binary_or_binary_and_ssrgemm_tn_n, 32x128x8_16x32x1_4x4_4x8_2x4 using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename 
cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1262,9 +1262,9 @@ TEST(SM50_device_binary_or_binary_and_ssrgemm_tn_n, 32x256x8_16x64x1_4x8_4x8_2x4 using WarpShape = cutlass::gemm::GemmShape<16, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1298,9 +1298,9 @@ TEST(SM50_device_binary_or_binary_and_ssrgemm_tn_n, 64x64x8_32x16x1_4x4_8x4_2x4) using WarpShape = cutlass::gemm::GemmShape<32, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1334,9 +1334,9 @@ TEST(SM50_device_binary_or_binary_and_ssrgemm_tn_n, 64x128x8_32x32x1_8x4_4x8_2x4 using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename 
cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1370,9 +1370,9 @@ TEST(SM50_device_binary_or_binary_and_ssrgemm_tn_n, 64x256x8_32x64x1_8x8_4x8_2x4 using WarpShape = cutlass::gemm::GemmShape<32, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1406,9 +1406,9 @@ TEST(SM50_device_binary_or_binary_and_ssrgemm_tn_n, 128x128x8_64x32x1_8x8_8x4_2x using WarpShape = cutlass::gemm::GemmShape<64, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1442,9 +1442,9 @@ TEST(SM50_device_binary_or_binary_and_ssrgemm_tn_n, 32x32x8_8x16x1_2x2_4x8_4x2) using WarpShape = cutlass::gemm::GemmShape<8, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename 
cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1478,9 +1478,9 @@ TEST(SM50_device_binary_or_binary_and_ssrgemm_tn_n, 64x32x8_16x16x1_4x2_4x8_4x2) using WarpShape = cutlass::gemm::GemmShape<16, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1514,9 +1514,9 @@ TEST(SM50_device_binary_or_binary_and_ssrgemm_tn_n, 64x64x8_16x32x1_4x4_4x8_4x2) using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1550,9 +1550,9 @@ TEST(SM50_device_binary_or_binary_and_ssrgemm_tn_n, 128x32x8_32x16x1_4x4_8x4_4x2 using WarpShape = cutlass::gemm::GemmShape<32, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename 
cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1586,9 +1586,9 @@ TEST(SM50_device_binary_or_binary_and_ssrgemm_tn_n, 128x64x8_32x32x1_8x4_4x8_4x2 using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1622,9 +1622,9 @@ TEST(SM50_device_binary_or_binary_and_ssrgemm_tn_n, 128x128x8_32x64x1_8x8_4x8_4x using WarpShape = cutlass::gemm::GemmShape<32, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1658,9 +1658,9 @@ TEST(SM50_device_binary_or_binary_and_ssrgemm_tn_n, 256x32x8_64x16x1_8x4_8x4_4x2 using WarpShape = cutlass::gemm::GemmShape<64, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename 
cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1694,9 +1694,9 @@ TEST(SM50_device_binary_or_binary_and_ssrgemm_tn_n, 256x64x8_64x32x1_8x8_8x4_4x2 using WarpShape = cutlass::gemm::GemmShape<64, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1730,9 +1730,9 @@ TEST(SM50_device_binary_or_binary_and_ssrgemm_tn_n, 32x64x16_8x16x1_2x2_4x8_4x4) using WarpShape = cutlass::gemm::GemmShape<8, 16, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1766,9 +1766,9 @@ TEST(SM50_device_binary_or_binary_and_ssrgemm_tn_n, 32x128x16_8x32x1_2x4_4x8_4x4 using WarpShape = cutlass::gemm::GemmShape<8, 32, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename 
cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1802,9 +1802,9 @@ TEST(SM50_device_binary_or_binary_and_ssrgemm_tn_n, 64x32x16_16x8x1_2x2_8x4_4x4) using WarpShape = cutlass::gemm::GemmShape<16, 8, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1838,9 +1838,9 @@ TEST(SM50_device_binary_or_binary_and_ssrgemm_tn_n, 64x64x8_16x16x1_4x2_4x8_4x4) using WarpShape = cutlass::gemm::GemmShape<16, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1874,9 +1874,9 @@ TEST(SM50_device_binary_or_binary_and_ssrgemm_tn_n, 64x128x8_16x32x1_4x4_4x8_4x4 using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename 
cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1910,9 +1910,9 @@ TEST(SM50_device_binary_or_binary_and_ssrgemm_tn_n, 64x256x8_16x64x1_4x8_4x8_4x4 using WarpShape = cutlass::gemm::GemmShape<16, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1946,9 +1946,9 @@ TEST(SM50_device_binary_or_binary_and_ssrgemm_tn_n, 128x32x16_32x8x1_4x2_8x4_4x4 using WarpShape = cutlass::gemm::GemmShape<32, 8, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1982,9 +1982,9 @@ TEST(SM50_device_binary_or_binary_and_ssrgemm_tn_n, 128x64x8_32x16x1_4x4_8x4_4x4 using WarpShape = cutlass::gemm::GemmShape<32, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename 
cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -2018,9 +2018,9 @@ TEST(SM50_device_binary_or_binary_and_ssrgemm_tn_n, 128x128x8_32x32x1_8x4_4x8_4x using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -2054,9 +2054,9 @@ TEST(SM50_device_binary_or_binary_and_ssrgemm_tn_n, 256x64x8_64x16x1_8x4_8x4_4x4 using WarpShape = cutlass::gemm::GemmShape<64, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; diff --git a/test/device/sm50_simt_binary_or_binary_and_ssrgemm_tn_t.cu b/test/device/sm50_simt_binary_or_binary_and_ssrgemm_tn_t.cu index 79bd59f..30579e1 100644 --- a/test/device/sm50_simt_binary_or_binary_and_ssrgemm_tn_t.cu +++ b/test/device/sm50_simt_binary_or_binary_and_ssrgemm_tn_t.cu @@ -38,9 +38,9 @@ TEST(SM50_device_binary_or_binary_and_ssrgemm_tn_t, 8x32x8_8x32x1_2x4_4x8_1x1) { using WarpShape = cutlass::gemm::GemmShape<8, 32, 8>; using 
InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -74,9 +74,9 @@ TEST(SM50_device_binary_or_binary_and_ssrgemm_tn_t, 16x32x8_16x32x1_4x4_4x8_1x1) using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -110,9 +110,9 @@ TEST(SM50_device_binary_or_binary_and_ssrgemm_tn_t, 16x64x8_16x64x1_4x8_4x8_1x1) using WarpShape = cutlass::gemm::GemmShape<16, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -146,9 +146,9 @@ TEST(SM50_device_binary_or_binary_and_ssrgemm_tn_t, 32x32x8_32x32x1_8x4_4x8_1x1) using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = 
cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -182,9 +182,9 @@ TEST(SM50_device_binary_or_binary_and_ssrgemm_tn_t, 32x64x8_32x64x1_8x8_4x8_1x1) using WarpShape = cutlass::gemm::GemmShape<32, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -218,9 +218,9 @@ TEST(SM50_device_binary_or_binary_and_ssrgemm_tn_t, 64x32x8_64x32x1_8x8_8x4_1x1) using WarpShape = cutlass::gemm::GemmShape<64, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -254,9 +254,9 @@ TEST(SM50_device_binary_or_binary_and_ssrgemm_tn_t, 8x32x8_8x16x1_2x2_4x8_1x2) { using WarpShape = cutlass::gemm::GemmShape<8, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 
1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -290,9 +290,9 @@ TEST(SM50_device_binary_or_binary_and_ssrgemm_tn_t, 8x64x8_8x32x1_2x4_4x8_1x2) { using WarpShape = cutlass::gemm::GemmShape<8, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -326,9 +326,9 @@ TEST(SM50_device_binary_or_binary_and_ssrgemm_tn_t, 16x32x8_16x16x1_4x2_4x8_1x2) using WarpShape = cutlass::gemm::GemmShape<16, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -362,9 +362,9 @@ TEST(SM50_device_binary_or_binary_and_ssrgemm_tn_t, 16x64x8_16x32x1_4x4_4x8_1x2) using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = 
typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -398,9 +398,9 @@ TEST(SM50_device_binary_or_binary_and_ssrgemm_tn_t, 16x128x8_16x64x1_4x8_4x8_1x2 using WarpShape = cutlass::gemm::GemmShape<16, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -434,9 +434,9 @@ TEST(SM50_device_binary_or_binary_and_ssrgemm_tn_t, 32x32x8_32x16x1_4x4_8x4_1x2) using WarpShape = cutlass::gemm::GemmShape<32, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -470,9 +470,9 @@ TEST(SM50_device_binary_or_binary_and_ssrgemm_tn_t, 32x64x8_32x32x1_8x4_4x8_1x2) using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename 
cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -506,9 +506,9 @@ TEST(SM50_device_binary_or_binary_and_ssrgemm_tn_t, 32x128x8_32x64x1_8x8_4x8_1x2 using WarpShape = cutlass::gemm::GemmShape<32, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -542,9 +542,9 @@ TEST(SM50_device_binary_or_binary_and_ssrgemm_tn_t, 64x64x8_64x32x1_8x8_8x4_1x2) using WarpShape = cutlass::gemm::GemmShape<64, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -578,9 +578,9 @@ TEST(SM50_device_binary_or_binary_and_ssrgemm_tn_t, 32x32x8_16x32x1_4x4_4x8_2x1) using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename 
cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -614,9 +614,9 @@ TEST(SM50_device_binary_or_binary_and_ssrgemm_tn_t, 64x32x8_32x32x1_8x4_4x8_2x1) using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -650,9 +650,9 @@ TEST(SM50_device_binary_or_binary_and_ssrgemm_tn_t, 64x64x8_32x64x1_8x8_4x8_2x1) using WarpShape = cutlass::gemm::GemmShape<32, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -686,9 +686,9 @@ TEST(SM50_device_binary_or_binary_and_ssrgemm_tn_t, 128x32x8_64x32x1_8x8_8x4_2x1 using WarpShape = cutlass::gemm::GemmShape<64, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename 
cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -722,9 +722,9 @@ TEST(SM50_device_binary_or_binary_and_ssrgemm_tn_t, 16x32x8_8x16x1_2x2_4x8_2x2) using WarpShape = cutlass::gemm::GemmShape<8, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -758,9 +758,9 @@ TEST(SM50_device_binary_or_binary_and_ssrgemm_tn_t, 16x64x8_8x32x1_2x4_4x8_2x2) using WarpShape = cutlass::gemm::GemmShape<8, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -794,9 +794,9 @@ TEST(SM50_device_binary_or_binary_and_ssrgemm_tn_t, 32x32x8_16x16x1_4x2_4x8_2x2) using WarpShape = cutlass::gemm::GemmShape<16, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename 
cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -830,9 +830,9 @@ TEST(SM50_device_binary_or_binary_and_ssrgemm_tn_t, 32x64x8_16x32x1_4x4_4x8_2x2) using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -866,9 +866,9 @@ TEST(SM50_device_binary_or_binary_and_ssrgemm_tn_t, 32x128x8_16x64x1_4x8_4x8_2x2 using WarpShape = cutlass::gemm::GemmShape<16, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -902,9 +902,9 @@ TEST(SM50_device_binary_or_binary_and_ssrgemm_tn_t, 64x32x8_32x16x1_4x4_8x4_2x2) using WarpShape = cutlass::gemm::GemmShape<32, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename 
cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -938,9 +938,9 @@ TEST(SM50_device_binary_or_binary_and_ssrgemm_tn_t, 64x64x8_32x32x1_8x4_4x8_2x2) using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -974,9 +974,9 @@ TEST(SM50_device_binary_or_binary_and_ssrgemm_tn_t, 64x128x8_32x64x1_8x8_4x8_2x2 using WarpShape = cutlass::gemm::GemmShape<32, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1010,9 +1010,9 @@ TEST(SM50_device_binary_or_binary_and_ssrgemm_tn_t, 128x32x8_64x16x1_8x4_8x4_2x2 using WarpShape = cutlass::gemm::GemmShape<64, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename 
cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1046,9 +1046,9 @@ TEST(SM50_device_binary_or_binary_and_ssrgemm_tn_t, 128x64x8_64x32x1_8x8_8x4_2x2 using WarpShape = cutlass::gemm::GemmShape<64, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1082,9 +1082,9 @@ TEST(SM50_device_binary_or_binary_and_ssrgemm_tn_t, 16x64x16_8x16x1_2x2_4x8_2x4) using WarpShape = cutlass::gemm::GemmShape<8, 16, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1118,9 +1118,9 @@ TEST(SM50_device_binary_or_binary_and_ssrgemm_tn_t, 16x128x16_8x32x1_2x4_4x8_2x4 using WarpShape = cutlass::gemm::GemmShape<8, 32, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename 
cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1154,9 +1154,9 @@ TEST(SM50_device_binary_or_binary_and_ssrgemm_tn_t, 32x32x8_16x8x1_2x2_8x4_2x4) using WarpShape = cutlass::gemm::GemmShape<16, 8, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1190,9 +1190,9 @@ TEST(SM50_device_binary_or_binary_and_ssrgemm_tn_t, 32x64x8_16x16x1_4x2_4x8_2x4) using WarpShape = cutlass::gemm::GemmShape<16, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1226,9 +1226,9 @@ TEST(SM50_device_binary_or_binary_and_ssrgemm_tn_t, 32x128x8_16x32x1_4x4_4x8_2x4 using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename 
cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1262,9 +1262,9 @@ TEST(SM50_device_binary_or_binary_and_ssrgemm_tn_t, 32x256x8_16x64x1_4x8_4x8_2x4 using WarpShape = cutlass::gemm::GemmShape<16, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1298,9 +1298,9 @@ TEST(SM50_device_binary_or_binary_and_ssrgemm_tn_t, 64x64x8_32x16x1_4x4_8x4_2x4) using WarpShape = cutlass::gemm::GemmShape<32, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1334,9 +1334,9 @@ TEST(SM50_device_binary_or_binary_and_ssrgemm_tn_t, 64x128x8_32x32x1_8x4_4x8_2x4 using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename 
cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1370,9 +1370,9 @@ TEST(SM50_device_binary_or_binary_and_ssrgemm_tn_t, 64x256x8_32x64x1_8x8_4x8_2x4 using WarpShape = cutlass::gemm::GemmShape<32, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1406,9 +1406,9 @@ TEST(SM50_device_binary_or_binary_and_ssrgemm_tn_t, 128x128x8_64x32x1_8x8_8x4_2x using WarpShape = cutlass::gemm::GemmShape<64, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1442,9 +1442,9 @@ TEST(SM50_device_binary_or_binary_and_ssrgemm_tn_t, 32x32x8_8x16x1_2x2_4x8_4x2) using WarpShape = cutlass::gemm::GemmShape<8, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename 
cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1478,9 +1478,9 @@ TEST(SM50_device_binary_or_binary_and_ssrgemm_tn_t, 64x32x8_16x16x1_4x2_4x8_4x2) using WarpShape = cutlass::gemm::GemmShape<16, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1514,9 +1514,9 @@ TEST(SM50_device_binary_or_binary_and_ssrgemm_tn_t, 64x64x8_16x32x1_4x4_4x8_4x2) using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1550,9 +1550,9 @@ TEST(SM50_device_binary_or_binary_and_ssrgemm_tn_t, 128x32x8_32x16x1_4x4_8x4_4x2 using WarpShape = cutlass::gemm::GemmShape<32, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename 
cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1586,9 +1586,9 @@ TEST(SM50_device_binary_or_binary_and_ssrgemm_tn_t, 128x64x8_32x32x1_8x4_4x8_4x2 using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1622,9 +1622,9 @@ TEST(SM50_device_binary_or_binary_and_ssrgemm_tn_t, 128x128x8_32x64x1_8x8_4x8_4x using WarpShape = cutlass::gemm::GemmShape<32, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1658,9 +1658,9 @@ TEST(SM50_device_binary_or_binary_and_ssrgemm_tn_t, 256x32x8_64x16x1_8x4_8x4_4x2 using WarpShape = cutlass::gemm::GemmShape<64, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename 
cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1694,9 +1694,9 @@ TEST(SM50_device_binary_or_binary_and_ssrgemm_tn_t, 256x64x8_64x32x1_8x8_8x4_4x2 using WarpShape = cutlass::gemm::GemmShape<64, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1730,9 +1730,9 @@ TEST(SM50_device_binary_or_binary_and_ssrgemm_tn_t, 32x64x16_8x16x1_2x2_4x8_4x4) using WarpShape = cutlass::gemm::GemmShape<8, 16, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1766,9 +1766,9 @@ TEST(SM50_device_binary_or_binary_and_ssrgemm_tn_t, 32x128x16_8x32x1_2x4_4x8_4x4 using WarpShape = cutlass::gemm::GemmShape<8, 32, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename 
cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1802,9 +1802,9 @@ TEST(SM50_device_binary_or_binary_and_ssrgemm_tn_t, 64x32x16_16x8x1_2x2_8x4_4x4) using WarpShape = cutlass::gemm::GemmShape<16, 8, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1838,9 +1838,9 @@ TEST(SM50_device_binary_or_binary_and_ssrgemm_tn_t, 64x64x8_16x16x1_4x2_4x8_4x4) using WarpShape = cutlass::gemm::GemmShape<16, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1874,9 +1874,9 @@ TEST(SM50_device_binary_or_binary_and_ssrgemm_tn_t, 64x128x8_16x32x1_4x4_4x8_4x4 using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename 
cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1910,9 +1910,9 @@ TEST(SM50_device_binary_or_binary_and_ssrgemm_tn_t, 64x256x8_16x64x1_4x8_4x8_4x4 using WarpShape = cutlass::gemm::GemmShape<16, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1946,9 +1946,9 @@ TEST(SM50_device_binary_or_binary_and_ssrgemm_tn_t, 128x32x16_32x8x1_4x2_8x4_4x4 using WarpShape = cutlass::gemm::GemmShape<32, 8, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1982,9 +1982,9 @@ TEST(SM50_device_binary_or_binary_and_ssrgemm_tn_t, 128x64x8_32x16x1_4x4_8x4_4x4 using WarpShape = cutlass::gemm::GemmShape<32, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename 
cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -2018,9 +2018,9 @@ TEST(SM50_device_binary_or_binary_and_ssrgemm_tn_t, 128x128x8_32x32x1_8x4_4x8_4x using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -2054,9 +2054,9 @@ TEST(SM50_device_binary_or_binary_and_ssrgemm_tn_t, 256x64x8_64x16x1_8x4_8x4_4x4 using WarpShape = cutlass::gemm::GemmShape<64, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; diff --git a/test/device/sm50_simt_binary_or_binary_and_ssrgemm_tt_n.cu b/test/device/sm50_simt_binary_or_binary_and_ssrgemm_tt_n.cu index 34e7c3b..b96fc1f 100644 --- a/test/device/sm50_simt_binary_or_binary_and_ssrgemm_tt_n.cu +++ 
b/test/device/sm50_simt_binary_or_binary_and_ssrgemm_tt_n.cu @@ -38,9 +38,9 @@ TEST(SM50_device_binary_or_binary_and_ssrgemm_tt_n, 8x32x8_8x32x1_2x4_4x8_1x1) { using WarpShape = cutlass::gemm::GemmShape<8, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -74,9 +74,9 @@ TEST(SM50_device_binary_or_binary_and_ssrgemm_tt_n, 16x32x8_16x32x1_4x4_4x8_1x1) using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -110,9 +110,9 @@ TEST(SM50_device_binary_or_binary_and_ssrgemm_tt_n, 16x64x8_16x64x1_4x8_4x8_1x1) using WarpShape = cutlass::gemm::GemmShape<16, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp 
= Config::MultiplicationOp; @@ -146,9 +146,9 @@ TEST(SM50_device_binary_or_binary_and_ssrgemm_tt_n, 32x32x8_32x32x1_8x4_4x8_1x1) using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -182,9 +182,9 @@ TEST(SM50_device_binary_or_binary_and_ssrgemm_tt_n, 32x64x8_32x64x1_8x8_4x8_1x1) using WarpShape = cutlass::gemm::GemmShape<32, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -218,9 +218,9 @@ TEST(SM50_device_binary_or_binary_and_ssrgemm_tt_n, 64x32x8_64x32x1_8x8_8x4_1x1) using WarpShape = cutlass::gemm::GemmShape<64, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; 
@@ -254,9 +254,9 @@ TEST(SM50_device_binary_or_binary_and_ssrgemm_tt_n, 8x32x8_8x16x1_2x2_4x8_1x2) { using WarpShape = cutlass::gemm::GemmShape<8, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -290,9 +290,9 @@ TEST(SM50_device_binary_or_binary_and_ssrgemm_tt_n, 8x64x8_8x32x1_2x4_4x8_1x2) { using WarpShape = cutlass::gemm::GemmShape<8, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -326,9 +326,9 @@ TEST(SM50_device_binary_or_binary_and_ssrgemm_tt_n, 16x32x8_16x16x1_4x2_4x8_1x2) using WarpShape = cutlass::gemm::GemmShape<16, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -362,9 +362,9 @@ 
TEST(SM50_device_binary_or_binary_and_ssrgemm_tt_n, 16x64x8_16x32x1_4x4_4x8_1x2) using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -398,9 +398,9 @@ TEST(SM50_device_binary_or_binary_and_ssrgemm_tt_n, 16x128x8_16x64x1_4x8_4x8_1x2 using WarpShape = cutlass::gemm::GemmShape<16, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -434,9 +434,9 @@ TEST(SM50_device_binary_or_binary_and_ssrgemm_tt_n, 32x32x8_32x16x1_4x4_8x4_1x2) using WarpShape = cutlass::gemm::GemmShape<32, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -470,9 +470,9 @@ 
TEST(SM50_device_binary_or_binary_and_ssrgemm_tt_n, 32x64x8_32x32x1_8x4_4x8_1x2) using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -506,9 +506,9 @@ TEST(SM50_device_binary_or_binary_and_ssrgemm_tt_n, 32x128x8_32x64x1_8x8_4x8_1x2 using WarpShape = cutlass::gemm::GemmShape<32, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -542,9 +542,9 @@ TEST(SM50_device_binary_or_binary_and_ssrgemm_tt_n, 64x64x8_64x32x1_8x8_8x4_1x2) using WarpShape = cutlass::gemm::GemmShape<64, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -578,9 +578,9 @@ 
TEST(SM50_device_binary_or_binary_and_ssrgemm_tt_n, 32x32x8_16x32x1_4x4_4x8_2x1) using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -614,9 +614,9 @@ TEST(SM50_device_binary_or_binary_and_ssrgemm_tt_n, 64x32x8_32x32x1_8x4_4x8_2x1) using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -650,9 +650,9 @@ TEST(SM50_device_binary_or_binary_and_ssrgemm_tt_n, 64x64x8_32x64x1_8x8_4x8_2x1) using WarpShape = cutlass::gemm::GemmShape<32, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -686,9 +686,9 @@ 
TEST(SM50_device_binary_or_binary_and_ssrgemm_tt_n, 128x32x8_64x32x1_8x8_8x4_2x1 using WarpShape = cutlass::gemm::GemmShape<64, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -722,9 +722,9 @@ TEST(SM50_device_binary_or_binary_and_ssrgemm_tt_n, 16x32x8_8x16x1_2x2_4x8_2x2) using WarpShape = cutlass::gemm::GemmShape<8, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -758,9 +758,9 @@ TEST(SM50_device_binary_or_binary_and_ssrgemm_tt_n, 16x64x8_8x32x1_2x4_4x8_2x2) using WarpShape = cutlass::gemm::GemmShape<8, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -794,9 +794,9 @@ 
TEST(SM50_device_binary_or_binary_and_ssrgemm_tt_n, 32x32x8_16x16x1_4x2_4x8_2x2) using WarpShape = cutlass::gemm::GemmShape<16, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -830,9 +830,9 @@ TEST(SM50_device_binary_or_binary_and_ssrgemm_tt_n, 32x64x8_16x32x1_4x4_4x8_2x2) using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -866,9 +866,9 @@ TEST(SM50_device_binary_or_binary_and_ssrgemm_tt_n, 32x128x8_16x64x1_4x8_4x8_2x2 using WarpShape = cutlass::gemm::GemmShape<16, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -902,9 +902,9 @@ 
TEST(SM50_device_binary_or_binary_and_ssrgemm_tt_n, 64x32x8_32x16x1_4x4_8x4_2x2) using WarpShape = cutlass::gemm::GemmShape<32, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -938,9 +938,9 @@ TEST(SM50_device_binary_or_binary_and_ssrgemm_tt_n, 64x64x8_32x32x1_8x4_4x8_2x2) using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -974,9 +974,9 @@ TEST(SM50_device_binary_or_binary_and_ssrgemm_tt_n, 64x128x8_32x64x1_8x8_4x8_2x2 using WarpShape = cutlass::gemm::GemmShape<32, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1010,9 +1010,9 @@ 
TEST(SM50_device_binary_or_binary_and_ssrgemm_tt_n, 128x32x8_64x16x1_8x4_8x4_2x2 using WarpShape = cutlass::gemm::GemmShape<64, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1046,9 +1046,9 @@ TEST(SM50_device_binary_or_binary_and_ssrgemm_tt_n, 128x64x8_64x32x1_8x8_8x4_2x2 using WarpShape = cutlass::gemm::GemmShape<64, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1082,9 +1082,9 @@ TEST(SM50_device_binary_or_binary_and_ssrgemm_tt_n, 16x64x16_8x16x1_2x2_4x8_2x4) using WarpShape = cutlass::gemm::GemmShape<8, 16, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1118,9 +1118,9 @@ 
TEST(SM50_device_binary_or_binary_and_ssrgemm_tt_n, 16x128x16_8x32x1_2x4_4x8_2x4 using WarpShape = cutlass::gemm::GemmShape<8, 32, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1154,9 +1154,9 @@ TEST(SM50_device_binary_or_binary_and_ssrgemm_tt_n, 32x32x8_16x8x1_2x2_8x4_2x4) using WarpShape = cutlass::gemm::GemmShape<16, 8, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1190,9 +1190,9 @@ TEST(SM50_device_binary_or_binary_and_ssrgemm_tt_n, 32x64x8_16x16x1_4x2_4x8_2x4) using WarpShape = cutlass::gemm::GemmShape<16, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1226,9 +1226,9 @@ 
TEST(SM50_device_binary_or_binary_and_ssrgemm_tt_n, 32x128x8_16x32x1_4x4_4x8_2x4 using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1262,9 +1262,9 @@ TEST(SM50_device_binary_or_binary_and_ssrgemm_tt_n, 32x256x8_16x64x1_4x8_4x8_2x4 using WarpShape = cutlass::gemm::GemmShape<16, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1298,9 +1298,9 @@ TEST(SM50_device_binary_or_binary_and_ssrgemm_tt_n, 64x64x8_32x16x1_4x4_8x4_2x4) using WarpShape = cutlass::gemm::GemmShape<32, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1334,9 +1334,9 @@ 
TEST(SM50_device_binary_or_binary_and_ssrgemm_tt_n, 64x128x8_32x32x1_8x4_4x8_2x4 using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1370,9 +1370,9 @@ TEST(SM50_device_binary_or_binary_and_ssrgemm_tt_n, 64x256x8_32x64x1_8x8_4x8_2x4 using WarpShape = cutlass::gemm::GemmShape<32, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1406,9 +1406,9 @@ TEST(SM50_device_binary_or_binary_and_ssrgemm_tt_n, 128x128x8_64x32x1_8x8_8x4_2x using WarpShape = cutlass::gemm::GemmShape<64, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1442,9 +1442,9 @@ 
TEST(SM50_device_binary_or_binary_and_ssrgemm_tt_n, 32x32x8_8x16x1_2x2_4x8_4x2) using WarpShape = cutlass::gemm::GemmShape<8, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1478,9 +1478,9 @@ TEST(SM50_device_binary_or_binary_and_ssrgemm_tt_n, 64x32x8_16x16x1_4x2_4x8_4x2) using WarpShape = cutlass::gemm::GemmShape<16, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1514,9 +1514,9 @@ TEST(SM50_device_binary_or_binary_and_ssrgemm_tt_n, 64x64x8_16x32x1_4x4_4x8_4x2) using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1550,9 +1550,9 @@ 
TEST(SM50_device_binary_or_binary_and_ssrgemm_tt_n, 128x32x8_32x16x1_4x4_8x4_4x2 using WarpShape = cutlass::gemm::GemmShape<32, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1586,9 +1586,9 @@ TEST(SM50_device_binary_or_binary_and_ssrgemm_tt_n, 128x64x8_32x32x1_8x4_4x8_4x2 using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1622,9 +1622,9 @@ TEST(SM50_device_binary_or_binary_and_ssrgemm_tt_n, 128x128x8_32x64x1_8x8_4x8_4x using WarpShape = cutlass::gemm::GemmShape<32, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1658,9 +1658,9 @@ 
TEST(SM50_device_binary_or_binary_and_ssrgemm_tt_n, 256x32x8_64x16x1_8x4_8x4_4x2 using WarpShape = cutlass::gemm::GemmShape<64, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1694,9 +1694,9 @@ TEST(SM50_device_binary_or_binary_and_ssrgemm_tt_n, 256x64x8_64x32x1_8x8_8x4_4x2 using WarpShape = cutlass::gemm::GemmShape<64, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1730,9 +1730,9 @@ TEST(SM50_device_binary_or_binary_and_ssrgemm_tt_n, 32x64x16_8x16x1_2x2_4x8_4x4) using WarpShape = cutlass::gemm::GemmShape<8, 16, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1766,9 +1766,9 @@ 
TEST(SM50_device_binary_or_binary_and_ssrgemm_tt_n, 32x128x16_8x32x1_2x4_4x8_4x4 using WarpShape = cutlass::gemm::GemmShape<8, 32, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1802,9 +1802,9 @@ TEST(SM50_device_binary_or_binary_and_ssrgemm_tt_n, 64x32x16_16x8x1_2x2_8x4_4x4) using WarpShape = cutlass::gemm::GemmShape<16, 8, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1838,9 +1838,9 @@ TEST(SM50_device_binary_or_binary_and_ssrgemm_tt_n, 64x64x8_16x16x1_4x2_4x8_4x4) using WarpShape = cutlass::gemm::GemmShape<16, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1874,9 +1874,9 @@ 
TEST(SM50_device_binary_or_binary_and_ssrgemm_tt_n, 64x128x8_16x32x1_4x4_4x8_4x4 using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1910,9 +1910,9 @@ TEST(SM50_device_binary_or_binary_and_ssrgemm_tt_n, 64x256x8_16x64x1_4x8_4x8_4x4 using WarpShape = cutlass::gemm::GemmShape<16, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1946,9 +1946,9 @@ TEST(SM50_device_binary_or_binary_and_ssrgemm_tt_n, 128x32x16_32x8x1_4x2_8x4_4x4 using WarpShape = cutlass::gemm::GemmShape<32, 8, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1982,9 +1982,9 @@ 
TEST(SM50_device_binary_or_binary_and_ssrgemm_tt_n, 128x64x8_32x16x1_4x4_8x4_4x4 using WarpShape = cutlass::gemm::GemmShape<32, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -2018,9 +2018,9 @@ TEST(SM50_device_binary_or_binary_and_ssrgemm_tt_n, 128x128x8_32x32x1_8x4_4x8_4x using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -2054,9 +2054,9 @@ TEST(SM50_device_binary_or_binary_and_ssrgemm_tt_n, 256x64x8_64x16x1_8x4_8x4_4x4 using WarpShape = cutlass::gemm::GemmShape<64, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; diff --git 
a/test/device/sm50_simt_binary_or_binary_and_ssrgemm_tt_t.cu b/test/device/sm50_simt_binary_or_binary_and_ssrgemm_tt_t.cu index 5fe557d..e3b5a51 100644 --- a/test/device/sm50_simt_binary_or_binary_and_ssrgemm_tt_t.cu +++ b/test/device/sm50_simt_binary_or_binary_and_ssrgemm_tt_t.cu @@ -38,9 +38,9 @@ TEST(SM50_device_binary_or_binary_and_ssrgemm_tt_t, 8x32x8_8x32x1_2x4_4x8_1x1) { using WarpShape = cutlass::gemm::GemmShape<8, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -74,9 +74,9 @@ TEST(SM50_device_binary_or_binary_and_ssrgemm_tt_t, 16x32x8_16x32x1_4x4_4x8_1x1) using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -110,9 +110,9 @@ TEST(SM50_device_binary_or_binary_and_ssrgemm_tt_t, 16x64x8_16x64x1_4x8_4x8_1x1) using WarpShape = cutlass::gemm::GemmShape<16, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + 
using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -146,9 +146,9 @@ TEST(SM50_device_binary_or_binary_and_ssrgemm_tt_t, 32x32x8_32x32x1_8x4_4x8_1x1) using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -182,9 +182,9 @@ TEST(SM50_device_binary_or_binary_and_ssrgemm_tt_t, 32x64x8_32x64x1_8x8_4x8_1x1) using WarpShape = cutlass::gemm::GemmShape<32, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -218,9 +218,9 @@ TEST(SM50_device_binary_or_binary_and_ssrgemm_tt_t, 64x32x8_64x32x1_8x8_8x4_1x1) using WarpShape = cutlass::gemm::GemmShape<64, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename 
cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -254,9 +254,9 @@ TEST(SM50_device_binary_or_binary_and_ssrgemm_tt_t, 8x32x8_8x16x1_2x2_4x8_1x2) { using WarpShape = cutlass::gemm::GemmShape<8, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -290,9 +290,9 @@ TEST(SM50_device_binary_or_binary_and_ssrgemm_tt_t, 8x64x8_8x32x1_2x4_4x8_1x2) { using WarpShape = cutlass::gemm::GemmShape<8, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -326,9 +326,9 @@ TEST(SM50_device_binary_or_binary_and_ssrgemm_tt_t, 16x32x8_16x16x1_4x2_4x8_1x2) using WarpShape = cutlass::gemm::GemmShape<16, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename 
cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -362,9 +362,9 @@ TEST(SM50_device_binary_or_binary_and_ssrgemm_tt_t, 16x64x8_16x32x1_4x4_4x8_1x2) using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -398,9 +398,9 @@ TEST(SM50_device_binary_or_binary_and_ssrgemm_tt_t, 16x128x8_16x64x1_4x8_4x8_1x2 using WarpShape = cutlass::gemm::GemmShape<16, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -434,9 +434,9 @@ TEST(SM50_device_binary_or_binary_and_ssrgemm_tt_t, 32x32x8_32x16x1_4x4_8x4_1x2) using WarpShape = cutlass::gemm::GemmShape<32, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename 
cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -470,9 +470,9 @@ TEST(SM50_device_binary_or_binary_and_ssrgemm_tt_t, 32x64x8_32x32x1_8x4_4x8_1x2) using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -506,9 +506,9 @@ TEST(SM50_device_binary_or_binary_and_ssrgemm_tt_t, 32x128x8_32x64x1_8x8_4x8_1x2 using WarpShape = cutlass::gemm::GemmShape<32, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -542,9 +542,9 @@ TEST(SM50_device_binary_or_binary_and_ssrgemm_tt_t, 64x64x8_64x32x1_8x8_8x4_1x2) using WarpShape = cutlass::gemm::GemmShape<64, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename 
cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -578,9 +578,9 @@ TEST(SM50_device_binary_or_binary_and_ssrgemm_tt_t, 32x32x8_16x32x1_4x4_4x8_2x1) using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -614,9 +614,9 @@ TEST(SM50_device_binary_or_binary_and_ssrgemm_tt_t, 64x32x8_32x32x1_8x4_4x8_2x1) using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -650,9 +650,9 @@ TEST(SM50_device_binary_or_binary_and_ssrgemm_tt_t, 64x64x8_32x64x1_8x8_4x8_2x1) using WarpShape = cutlass::gemm::GemmShape<32, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename 
cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -686,9 +686,9 @@ TEST(SM50_device_binary_or_binary_and_ssrgemm_tt_t, 128x32x8_64x32x1_8x8_8x4_2x1 using WarpShape = cutlass::gemm::GemmShape<64, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -722,9 +722,9 @@ TEST(SM50_device_binary_or_binary_and_ssrgemm_tt_t, 16x32x8_8x16x1_2x2_4x8_2x2) using WarpShape = cutlass::gemm::GemmShape<8, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -758,9 +758,9 @@ TEST(SM50_device_binary_or_binary_and_ssrgemm_tt_t, 16x64x8_8x32x1_2x4_4x8_2x2) using WarpShape = cutlass::gemm::GemmShape<8, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename 
cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -794,9 +794,9 @@ TEST(SM50_device_binary_or_binary_and_ssrgemm_tt_t, 32x32x8_16x16x1_4x2_4x8_2x2) using WarpShape = cutlass::gemm::GemmShape<16, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -830,9 +830,9 @@ TEST(SM50_device_binary_or_binary_and_ssrgemm_tt_t, 32x64x8_16x32x1_4x4_4x8_2x2) using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -866,9 +866,9 @@ TEST(SM50_device_binary_or_binary_and_ssrgemm_tt_t, 32x128x8_16x64x1_4x8_4x8_2x2 using WarpShape = cutlass::gemm::GemmShape<16, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename 
cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -902,9 +902,9 @@ TEST(SM50_device_binary_or_binary_and_ssrgemm_tt_t, 64x32x8_32x16x1_4x4_8x4_2x2) using WarpShape = cutlass::gemm::GemmShape<32, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -938,9 +938,9 @@ TEST(SM50_device_binary_or_binary_and_ssrgemm_tt_t, 64x64x8_32x32x1_8x4_4x8_2x2) using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -974,9 +974,9 @@ TEST(SM50_device_binary_or_binary_and_ssrgemm_tt_t, 64x128x8_32x64x1_8x8_4x8_2x2 using WarpShape = cutlass::gemm::GemmShape<32, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename 
cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1010,9 +1010,9 @@ TEST(SM50_device_binary_or_binary_and_ssrgemm_tt_t, 128x32x8_64x16x1_8x4_8x4_2x2 using WarpShape = cutlass::gemm::GemmShape<64, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1046,9 +1046,9 @@ TEST(SM50_device_binary_or_binary_and_ssrgemm_tt_t, 128x64x8_64x32x1_8x8_8x4_2x2 using WarpShape = cutlass::gemm::GemmShape<64, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1082,9 +1082,9 @@ TEST(SM50_device_binary_or_binary_and_ssrgemm_tt_t, 16x64x16_8x16x1_2x2_4x8_2x4) using WarpShape = cutlass::gemm::GemmShape<8, 16, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename 
cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1118,9 +1118,9 @@ TEST(SM50_device_binary_or_binary_and_ssrgemm_tt_t, 16x128x16_8x32x1_2x4_4x8_2x4 using WarpShape = cutlass::gemm::GemmShape<8, 32, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1154,9 +1154,9 @@ TEST(SM50_device_binary_or_binary_and_ssrgemm_tt_t, 32x32x8_16x8x1_2x2_8x4_2x4) using WarpShape = cutlass::gemm::GemmShape<16, 8, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1190,9 +1190,9 @@ TEST(SM50_device_binary_or_binary_and_ssrgemm_tt_t, 32x64x8_16x16x1_4x2_4x8_2x4) using WarpShape = cutlass::gemm::GemmShape<16, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename 
cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1226,9 +1226,9 @@ TEST(SM50_device_binary_or_binary_and_ssrgemm_tt_t, 32x128x8_16x32x1_4x4_4x8_2x4 using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1262,9 +1262,9 @@ TEST(SM50_device_binary_or_binary_and_ssrgemm_tt_t, 32x256x8_16x64x1_4x8_4x8_2x4 using WarpShape = cutlass::gemm::GemmShape<16, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1298,9 +1298,9 @@ TEST(SM50_device_binary_or_binary_and_ssrgemm_tt_t, 64x64x8_32x16x1_4x4_8x4_2x4) using WarpShape = cutlass::gemm::GemmShape<32, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename 
cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1334,9 +1334,9 @@ TEST(SM50_device_binary_or_binary_and_ssrgemm_tt_t, 64x128x8_32x32x1_8x4_4x8_2x4 using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1370,9 +1370,9 @@ TEST(SM50_device_binary_or_binary_and_ssrgemm_tt_t, 64x256x8_32x64x1_8x8_4x8_2x4 using WarpShape = cutlass::gemm::GemmShape<32, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1406,9 +1406,9 @@ TEST(SM50_device_binary_or_binary_and_ssrgemm_tt_t, 128x128x8_64x32x1_8x8_8x4_2x using WarpShape = cutlass::gemm::GemmShape<64, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename 
cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1442,9 +1442,9 @@ TEST(SM50_device_binary_or_binary_and_ssrgemm_tt_t, 32x32x8_8x16x1_2x2_4x8_4x2) using WarpShape = cutlass::gemm::GemmShape<8, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1478,9 +1478,9 @@ TEST(SM50_device_binary_or_binary_and_ssrgemm_tt_t, 64x32x8_16x16x1_4x2_4x8_4x2) using WarpShape = cutlass::gemm::GemmShape<16, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1514,9 +1514,9 @@ TEST(SM50_device_binary_or_binary_and_ssrgemm_tt_t, 64x64x8_16x32x1_4x4_4x8_4x2) using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename 
cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1550,9 +1550,9 @@ TEST(SM50_device_binary_or_binary_and_ssrgemm_tt_t, 128x32x8_32x16x1_4x4_8x4_4x2 using WarpShape = cutlass::gemm::GemmShape<32, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1586,9 +1586,9 @@ TEST(SM50_device_binary_or_binary_and_ssrgemm_tt_t, 128x64x8_32x32x1_8x4_4x8_4x2 using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1622,9 +1622,9 @@ TEST(SM50_device_binary_or_binary_and_ssrgemm_tt_t, 128x128x8_32x64x1_8x8_4x8_4x using WarpShape = cutlass::gemm::GemmShape<32, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename 
cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1658,9 +1658,9 @@ TEST(SM50_device_binary_or_binary_and_ssrgemm_tt_t, 256x32x8_64x16x1_8x4_8x4_4x2 using WarpShape = cutlass::gemm::GemmShape<64, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1694,9 +1694,9 @@ TEST(SM50_device_binary_or_binary_and_ssrgemm_tt_t, 256x64x8_64x32x1_8x8_8x4_4x2 using WarpShape = cutlass::gemm::GemmShape<64, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1730,9 +1730,9 @@ TEST(SM50_device_binary_or_binary_and_ssrgemm_tt_t, 32x64x16_8x16x1_2x2_4x8_4x4) using WarpShape = cutlass::gemm::GemmShape<8, 16, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename 
cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1766,9 +1766,9 @@ TEST(SM50_device_binary_or_binary_and_ssrgemm_tt_t, 32x128x16_8x32x1_2x4_4x8_4x4 using WarpShape = cutlass::gemm::GemmShape<8, 32, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1802,9 +1802,9 @@ TEST(SM50_device_binary_or_binary_and_ssrgemm_tt_t, 64x32x16_16x8x1_2x2_8x4_4x4) using WarpShape = cutlass::gemm::GemmShape<16, 8, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1838,9 +1838,9 @@ TEST(SM50_device_binary_or_binary_and_ssrgemm_tt_t, 64x64x8_16x16x1_4x2_4x8_4x4) using WarpShape = cutlass::gemm::GemmShape<16, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename 
cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1874,9 +1874,9 @@ TEST(SM50_device_binary_or_binary_and_ssrgemm_tt_t, 64x128x8_16x32x1_4x4_4x8_4x4 using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1910,9 +1910,9 @@ TEST(SM50_device_binary_or_binary_and_ssrgemm_tt_t, 64x256x8_16x64x1_4x8_4x8_4x4 using WarpShape = cutlass::gemm::GemmShape<16, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1946,9 +1946,9 @@ TEST(SM50_device_binary_or_binary_and_ssrgemm_tt_t, 128x32x16_32x8x1_4x2_8x4_4x4 using WarpShape = cutlass::gemm::GemmShape<32, 8, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename 
cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1982,9 +1982,9 @@ TEST(SM50_device_binary_or_binary_and_ssrgemm_tt_t, 128x64x8_32x16x1_4x4_8x4_4x4 using WarpShape = cutlass::gemm::GemmShape<32, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -2018,9 +2018,9 @@ TEST(SM50_device_binary_or_binary_and_ssrgemm_tt_t, 128x128x8_32x32x1_8x4_4x8_4x using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -2054,9 +2054,9 @@ TEST(SM50_device_binary_or_binary_and_ssrgemm_tt_t, 256x64x8_64x16x1_8x4_8x4_4x4 using WarpShape = cutlass::gemm::GemmShape<64, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::binary_or, cuasr::binary_and, SmArch>; + using Config = typename 
cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::binary_or, cuasr::binary_and, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; diff --git a/test/device/sm50_simt_maximum_minimum_dsrgemm_nn_n.cu b/test/device/sm50_simt_maximum_minimum_dsrgemm_nn_n.cu index 5946f66..360b891 100644 --- a/test/device/sm50_simt_maximum_minimum_dsrgemm_nn_n.cu +++ b/test/device/sm50_simt_maximum_minimum_dsrgemm_nn_n.cu @@ -38,9 +38,9 @@ TEST(SM50_device_maximum_minimum_dsrgemm_nn_n, 8x32x8_8x32x1_2x4_4x8_1x1) { using WarpShape = cutlass::gemm::GemmShape<8, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -74,9 +74,9 @@ TEST(SM50_device_maximum_minimum_dsrgemm_nn_n, 16x32x8_16x32x1_4x4_4x8_1x1) { using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -110,9 +110,9 @@ TEST(SM50_device_maximum_minimum_dsrgemm_nn_n, 16x64x8_16x64x1_4x8_4x8_1x1) { using WarpShape = cutlass::gemm::GemmShape<16, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - 
using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -146,9 +146,9 @@ TEST(SM50_device_maximum_minimum_dsrgemm_nn_n, 32x32x8_32x32x1_8x4_4x8_1x1) { using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -182,9 +182,9 @@ TEST(SM50_device_maximum_minimum_dsrgemm_nn_n, 8x32x8_8x16x1_2x2_4x8_1x2) { using WarpShape = cutlass::gemm::GemmShape<8, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -218,9 +218,9 @@ TEST(SM50_device_maximum_minimum_dsrgemm_nn_n, 8x64x8_8x32x1_2x4_4x8_1x2) { using WarpShape = cutlass::gemm::GemmShape<8, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename 
cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -254,9 +254,9 @@ TEST(SM50_device_maximum_minimum_dsrgemm_nn_n, 16x32x8_16x16x1_4x2_4x8_1x2) { using WarpShape = cutlass::gemm::GemmShape<16, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -290,9 +290,9 @@ TEST(SM50_device_maximum_minimum_dsrgemm_nn_n, 16x64x8_16x32x1_4x4_4x8_1x2) { using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -326,9 +326,9 @@ TEST(SM50_device_maximum_minimum_dsrgemm_nn_n, 16x128x8_16x64x1_4x8_4x8_1x2) { using WarpShape = cutlass::gemm::GemmShape<16, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, 
precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -362,9 +362,9 @@ TEST(SM50_device_maximum_minimum_dsrgemm_nn_n, 32x32x8_32x16x1_4x4_8x4_1x2) { using WarpShape = cutlass::gemm::GemmShape<32, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -398,9 +398,9 @@ TEST(SM50_device_maximum_minimum_dsrgemm_nn_n, 32x64x8_32x32x1_8x4_4x8_1x2) { using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -434,9 +434,9 @@ TEST(SM50_device_maximum_minimum_dsrgemm_nn_n, 32x32x8_16x32x1_4x4_4x8_2x1) { using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, 
cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -470,9 +470,9 @@ TEST(SM50_device_maximum_minimum_dsrgemm_nn_n, 64x32x8_32x32x1_8x4_4x8_2x1) { using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -506,9 +506,9 @@ TEST(SM50_device_maximum_minimum_dsrgemm_nn_n, 16x32x8_8x16x1_2x2_4x8_2x2) { using WarpShape = cutlass::gemm::GemmShape<8, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -542,9 +542,9 @@ TEST(SM50_device_maximum_minimum_dsrgemm_nn_n, 16x64x8_8x32x1_2x4_4x8_2x2) { using WarpShape = cutlass::gemm::GemmShape<8, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename 
cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -578,9 +578,9 @@ TEST(SM50_device_maximum_minimum_dsrgemm_nn_n, 32x32x8_16x16x1_4x2_4x8_2x2) { using WarpShape = cutlass::gemm::GemmShape<16, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -614,9 +614,9 @@ TEST(SM50_device_maximum_minimum_dsrgemm_nn_n, 32x64x8_16x32x1_4x4_4x8_2x2) { using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -650,9 +650,9 @@ TEST(SM50_device_maximum_minimum_dsrgemm_nn_n, 32x128x8_16x64x1_4x8_4x8_2x2) { using WarpShape = cutlass::gemm::GemmShape<16, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, 
precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -686,9 +686,9 @@ TEST(SM50_device_maximum_minimum_dsrgemm_nn_n, 64x32x8_32x16x1_4x4_8x4_2x2) { using WarpShape = cutlass::gemm::GemmShape<32, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -722,9 +722,9 @@ TEST(SM50_device_maximum_minimum_dsrgemm_nn_n, 64x64x8_32x32x1_8x4_4x8_2x2) { using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -758,9 +758,9 @@ TEST(SM50_device_maximum_minimum_dsrgemm_nn_n, 128x32x8_64x16x1_8x4_8x4_2x2) { using WarpShape = cutlass::gemm::GemmShape<64, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, 
OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -794,9 +794,9 @@ TEST(SM50_device_maximum_minimum_dsrgemm_nn_n, 16x64x16_8x16x1_2x2_4x8_2x4) { using WarpShape = cutlass::gemm::GemmShape<8, 16, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -830,9 +830,9 @@ TEST(SM50_device_maximum_minimum_dsrgemm_nn_n, 16x128x16_8x32x1_2x4_4x8_2x4) { using WarpShape = cutlass::gemm::GemmShape<8, 32, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -866,9 +866,9 @@ TEST(SM50_device_maximum_minimum_dsrgemm_nn_n, 32x32x8_16x8x1_2x2_8x4_2x4) { using WarpShape = cutlass::gemm::GemmShape<16, 8, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = 
Config::MultiplicationOp; @@ -902,9 +902,9 @@ TEST(SM50_device_maximum_minimum_dsrgemm_nn_n, 32x64x8_16x16x1_4x2_4x8_2x4) { using WarpShape = cutlass::gemm::GemmShape<16, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -938,9 +938,9 @@ TEST(SM50_device_maximum_minimum_dsrgemm_nn_n, 32x128x8_16x32x1_4x4_4x8_2x4) { using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -974,9 +974,9 @@ TEST(SM50_device_maximum_minimum_dsrgemm_nn_n, 64x64x8_32x16x1_4x4_8x4_2x4) { using WarpShape = cutlass::gemm::GemmShape<32, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1010,9 +1010,9 @@ 
TEST(SM50_device_maximum_minimum_dsrgemm_nn_n, 32x32x8_8x16x1_2x2_4x8_4x2) { using WarpShape = cutlass::gemm::GemmShape<8, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1046,9 +1046,9 @@ TEST(SM50_device_maximum_minimum_dsrgemm_nn_n, 64x32x8_16x16x1_4x2_4x8_4x2) { using WarpShape = cutlass::gemm::GemmShape<16, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1082,9 +1082,9 @@ TEST(SM50_device_maximum_minimum_dsrgemm_nn_n, 64x64x8_16x32x1_4x4_4x8_4x2) { using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1118,9 +1118,9 @@ TEST(SM50_device_maximum_minimum_dsrgemm_nn_n, 
128x32x8_32x16x1_4x4_8x4_4x2) { using WarpShape = cutlass::gemm::GemmShape<32, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1154,9 +1154,9 @@ TEST(SM50_device_maximum_minimum_dsrgemm_nn_n, 32x64x16_8x16x1_2x2_4x8_4x4) { using WarpShape = cutlass::gemm::GemmShape<8, 16, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1190,9 +1190,9 @@ TEST(SM50_device_maximum_minimum_dsrgemm_nn_n, 32x128x16_8x32x1_2x4_4x8_4x4) { using WarpShape = cutlass::gemm::GemmShape<8, 32, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1226,9 +1226,9 @@ TEST(SM50_device_maximum_minimum_dsrgemm_nn_n, 64x32x16_16x8x1_2x2_8x4_4x4) { using WarpShape = 
cutlass::gemm::GemmShape<16, 8, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1262,9 +1262,9 @@ TEST(SM50_device_maximum_minimum_dsrgemm_nn_n, 64x64x8_16x16x1_4x2_4x8_4x4) { using WarpShape = cutlass::gemm::GemmShape<16, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1298,9 +1298,9 @@ TEST(SM50_device_maximum_minimum_dsrgemm_nn_n, 128x32x16_32x8x1_4x2_8x4_4x4) { using WarpShape = cutlass::gemm::GemmShape<32, 8, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; diff --git a/test/device/sm50_simt_maximum_minimum_dsrgemm_nn_t.cu b/test/device/sm50_simt_maximum_minimum_dsrgemm_nn_t.cu index 300355c..2c49dbf 100644 --- 
a/test/device/sm50_simt_maximum_minimum_dsrgemm_nn_t.cu +++ b/test/device/sm50_simt_maximum_minimum_dsrgemm_nn_t.cu @@ -38,9 +38,9 @@ TEST(SM50_device_maximum_minimum_dsrgemm_nn_t, 8x32x8_8x32x1_2x4_4x8_1x1) { using WarpShape = cutlass::gemm::GemmShape<8, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -74,9 +74,9 @@ TEST(SM50_device_maximum_minimum_dsrgemm_nn_t, 16x32x8_16x32x1_4x4_4x8_1x1) { using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -110,9 +110,9 @@ TEST(SM50_device_maximum_minimum_dsrgemm_nn_t, 16x64x8_16x64x1_4x8_4x8_1x1) { using WarpShape = cutlass::gemm::GemmShape<16, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; 
using MultOp = Config::MultiplicationOp; @@ -146,9 +146,9 @@ TEST(SM50_device_maximum_minimum_dsrgemm_nn_t, 32x32x8_32x32x1_8x4_4x8_1x1) { using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -182,9 +182,9 @@ TEST(SM50_device_maximum_minimum_dsrgemm_nn_t, 8x32x8_8x16x1_2x2_4x8_1x2) { using WarpShape = cutlass::gemm::GemmShape<8, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -218,9 +218,9 @@ TEST(SM50_device_maximum_minimum_dsrgemm_nn_t, 8x64x8_8x32x1_2x4_4x8_1x2) { using WarpShape = cutlass::gemm::GemmShape<8, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -254,9 +254,9 @@ 
TEST(SM50_device_maximum_minimum_dsrgemm_nn_t, 16x32x8_16x16x1_4x2_4x8_1x2) { using WarpShape = cutlass::gemm::GemmShape<16, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -290,9 +290,9 @@ TEST(SM50_device_maximum_minimum_dsrgemm_nn_t, 16x64x8_16x32x1_4x4_4x8_1x2) { using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -326,9 +326,9 @@ TEST(SM50_device_maximum_minimum_dsrgemm_nn_t, 16x128x8_16x64x1_4x8_4x8_1x2) { using WarpShape = cutlass::gemm::GemmShape<16, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -362,9 +362,9 @@ TEST(SM50_device_maximum_minimum_dsrgemm_nn_t, 
32x32x8_32x16x1_4x4_8x4_1x2) { using WarpShape = cutlass::gemm::GemmShape<32, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -398,9 +398,9 @@ TEST(SM50_device_maximum_minimum_dsrgemm_nn_t, 32x64x8_32x32x1_8x4_4x8_1x2) { using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -434,9 +434,9 @@ TEST(SM50_device_maximum_minimum_dsrgemm_nn_t, 32x32x8_16x32x1_4x4_4x8_2x1) { using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -470,9 +470,9 @@ TEST(SM50_device_maximum_minimum_dsrgemm_nn_t, 64x32x8_32x32x1_8x4_4x8_2x1) { using WarpShape = 
cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -506,9 +506,9 @@ TEST(SM50_device_maximum_minimum_dsrgemm_nn_t, 16x32x8_8x16x1_2x2_4x8_2x2) { using WarpShape = cutlass::gemm::GemmShape<8, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -542,9 +542,9 @@ TEST(SM50_device_maximum_minimum_dsrgemm_nn_t, 16x64x8_8x32x1_2x4_4x8_2x2) { using WarpShape = cutlass::gemm::GemmShape<8, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -578,9 +578,9 @@ TEST(SM50_device_maximum_minimum_dsrgemm_nn_t, 32x32x8_16x16x1_4x2_4x8_2x2) { using WarpShape = cutlass::gemm::GemmShape<16, 16, 8>; using InstructionShape = 
cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -614,9 +614,9 @@ TEST(SM50_device_maximum_minimum_dsrgemm_nn_t, 32x64x8_16x32x1_4x4_4x8_2x2) { using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -650,9 +650,9 @@ TEST(SM50_device_maximum_minimum_dsrgemm_nn_t, 32x128x8_16x64x1_4x8_4x8_2x2) { using WarpShape = cutlass::gemm::GemmShape<16, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -686,9 +686,9 @@ TEST(SM50_device_maximum_minimum_dsrgemm_nn_t, 64x32x8_32x16x1_4x4_8x4_2x2) { using WarpShape = cutlass::gemm::GemmShape<32, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename 
cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -722,9 +722,9 @@ TEST(SM50_device_maximum_minimum_dsrgemm_nn_t, 64x64x8_32x32x1_8x4_4x8_2x2) { using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -758,9 +758,9 @@ TEST(SM50_device_maximum_minimum_dsrgemm_nn_t, 128x32x8_64x16x1_8x4_8x4_2x2) { using WarpShape = cutlass::gemm::GemmShape<64, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -794,9 +794,9 @@ TEST(SM50_device_maximum_minimum_dsrgemm_nn_t, 16x64x16_8x16x1_2x2_4x8_2x4) { using WarpShape = cutlass::gemm::GemmShape<8, 16, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, 
precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -830,9 +830,9 @@ TEST(SM50_device_maximum_minimum_dsrgemm_nn_t, 16x128x16_8x32x1_2x4_4x8_2x4) { using WarpShape = cutlass::gemm::GemmShape<8, 32, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -866,9 +866,9 @@ TEST(SM50_device_maximum_minimum_dsrgemm_nn_t, 32x32x8_16x8x1_2x2_8x4_2x4) { using WarpShape = cutlass::gemm::GemmShape<16, 8, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -902,9 +902,9 @@ TEST(SM50_device_maximum_minimum_dsrgemm_nn_t, 32x64x8_16x16x1_4x2_4x8_2x4) { using WarpShape = cutlass::gemm::GemmShape<16, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, 
cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -938,9 +938,9 @@ TEST(SM50_device_maximum_minimum_dsrgemm_nn_t, 32x128x8_16x32x1_4x4_4x8_2x4) { using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -974,9 +974,9 @@ TEST(SM50_device_maximum_minimum_dsrgemm_nn_t, 64x64x8_32x16x1_4x4_8x4_2x4) { using WarpShape = cutlass::gemm::GemmShape<32, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1010,9 +1010,9 @@ TEST(SM50_device_maximum_minimum_dsrgemm_nn_t, 32x32x8_8x16x1_2x2_4x8_4x2) { using WarpShape = cutlass::gemm::GemmShape<8, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename 
cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1046,9 +1046,9 @@ TEST(SM50_device_maximum_minimum_dsrgemm_nn_t, 64x32x8_16x16x1_4x2_4x8_4x2) { using WarpShape = cutlass::gemm::GemmShape<16, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1082,9 +1082,9 @@ TEST(SM50_device_maximum_minimum_dsrgemm_nn_t, 64x64x8_16x32x1_4x4_4x8_4x2) { using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1118,9 +1118,9 @@ TEST(SM50_device_maximum_minimum_dsrgemm_nn_t, 128x32x8_32x16x1_4x4_8x4_4x2) { using WarpShape = cutlass::gemm::GemmShape<32, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + 
precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1154,9 +1154,9 @@ TEST(SM50_device_maximum_minimum_dsrgemm_nn_t, 32x64x16_8x16x1_2x2_4x8_4x4) { using WarpShape = cutlass::gemm::GemmShape<8, 16, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1190,9 +1190,9 @@ TEST(SM50_device_maximum_minimum_dsrgemm_nn_t, 32x128x16_8x32x1_2x4_4x8_4x4) { using WarpShape = cutlass::gemm::GemmShape<8, 32, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1226,9 +1226,9 @@ TEST(SM50_device_maximum_minimum_dsrgemm_nn_t, 64x32x16_16x8x1_2x2_8x4_4x4) { using WarpShape = cutlass::gemm::GemmShape<16, 8, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + 
cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1262,9 +1262,9 @@ TEST(SM50_device_maximum_minimum_dsrgemm_nn_t, 64x64x8_16x16x1_4x2_4x8_4x4) { using WarpShape = cutlass::gemm::GemmShape<16, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1298,9 +1298,9 @@ TEST(SM50_device_maximum_minimum_dsrgemm_nn_t, 128x32x16_32x8x1_4x2_8x4_4x4) { using WarpShape = cutlass::gemm::GemmShape<32, 8, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; diff --git a/test/device/sm50_simt_maximum_minimum_dsrgemm_nt_n.cu b/test/device/sm50_simt_maximum_minimum_dsrgemm_nt_n.cu index 35a92b9..b150275 100644 --- a/test/device/sm50_simt_maximum_minimum_dsrgemm_nt_n.cu +++ b/test/device/sm50_simt_maximum_minimum_dsrgemm_nt_n.cu @@ -38,9 +38,9 @@ TEST(SM50_device_maximum_minimum_dsrgemm_nt_n, 8x32x8_8x32x1_2x4_4x8_1x1) { using WarpShape = cutlass::gemm::GemmShape<8, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, 
precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -74,9 +74,9 @@ TEST(SM50_device_maximum_minimum_dsrgemm_nt_n, 16x32x8_16x32x1_4x4_4x8_1x1) { using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -110,9 +110,9 @@ TEST(SM50_device_maximum_minimum_dsrgemm_nt_n, 16x64x8_16x64x1_4x8_4x8_1x1) { using WarpShape = cutlass::gemm::GemmShape<16, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -146,9 +146,9 @@ TEST(SM50_device_maximum_minimum_dsrgemm_nt_n, 32x32x8_32x32x1_8x4_4x8_1x1) { using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, 
cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -182,9 +182,9 @@ TEST(SM50_device_maximum_minimum_dsrgemm_nt_n, 8x32x8_8x16x1_2x2_4x8_1x2) { using WarpShape = cutlass::gemm::GemmShape<8, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -218,9 +218,9 @@ TEST(SM50_device_maximum_minimum_dsrgemm_nt_n, 8x64x8_8x32x1_2x4_4x8_1x2) { using WarpShape = cutlass::gemm::GemmShape<8, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -254,9 +254,9 @@ TEST(SM50_device_maximum_minimum_dsrgemm_nt_n, 16x32x8_16x16x1_4x2_4x8_1x2) { using WarpShape = cutlass::gemm::GemmShape<16, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename 
cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -290,9 +290,9 @@ TEST(SM50_device_maximum_minimum_dsrgemm_nt_n, 16x64x8_16x32x1_4x4_4x8_1x2) { using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -326,9 +326,9 @@ TEST(SM50_device_maximum_minimum_dsrgemm_nt_n, 16x128x8_16x64x1_4x8_4x8_1x2) { using WarpShape = cutlass::gemm::GemmShape<16, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -362,9 +362,9 @@ TEST(SM50_device_maximum_minimum_dsrgemm_nt_n, 32x32x8_32x16x1_4x4_8x4_1x2) { using WarpShape = cutlass::gemm::GemmShape<32, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, 
precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -398,9 +398,9 @@ TEST(SM50_device_maximum_minimum_dsrgemm_nt_n, 32x64x8_32x32x1_8x4_4x8_1x2) { using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -434,9 +434,9 @@ TEST(SM50_device_maximum_minimum_dsrgemm_nt_n, 32x32x8_16x32x1_4x4_4x8_2x1) { using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -470,9 +470,9 @@ TEST(SM50_device_maximum_minimum_dsrgemm_nt_n, 64x32x8_32x32x1_8x4_4x8_2x1) { using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, 
OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -506,9 +506,9 @@ TEST(SM50_device_maximum_minimum_dsrgemm_nt_n, 16x32x8_8x16x1_2x2_4x8_2x2) { using WarpShape = cutlass::gemm::GemmShape<8, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -542,9 +542,9 @@ TEST(SM50_device_maximum_minimum_dsrgemm_nt_n, 16x64x8_8x32x1_2x4_4x8_2x2) { using WarpShape = cutlass::gemm::GemmShape<8, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -578,9 +578,9 @@ TEST(SM50_device_maximum_minimum_dsrgemm_nt_n, 32x32x8_16x16x1_4x2_4x8_2x2) { using WarpShape = cutlass::gemm::GemmShape<16, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = 
Config::MultiplicationOp; @@ -614,9 +614,9 @@ TEST(SM50_device_maximum_minimum_dsrgemm_nt_n, 32x64x8_16x32x1_4x4_4x8_2x2) { using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -650,9 +650,9 @@ TEST(SM50_device_maximum_minimum_dsrgemm_nt_n, 32x128x8_16x64x1_4x8_4x8_2x2) { using WarpShape = cutlass::gemm::GemmShape<16, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -686,9 +686,9 @@ TEST(SM50_device_maximum_minimum_dsrgemm_nt_n, 64x32x8_32x16x1_4x4_8x4_2x2) { using WarpShape = cutlass::gemm::GemmShape<32, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -722,9 +722,9 @@ 
TEST(SM50_device_maximum_minimum_dsrgemm_nt_n, 64x64x8_32x32x1_8x4_4x8_2x2) { using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -758,9 +758,9 @@ TEST(SM50_device_maximum_minimum_dsrgemm_nt_n, 128x32x8_64x16x1_8x4_8x4_2x2) { using WarpShape = cutlass::gemm::GemmShape<64, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -794,9 +794,9 @@ TEST(SM50_device_maximum_minimum_dsrgemm_nt_n, 16x64x16_8x16x1_2x2_4x8_2x4) { using WarpShape = cutlass::gemm::GemmShape<8, 16, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -830,9 +830,9 @@ TEST(SM50_device_maximum_minimum_dsrgemm_nt_n, 
16x128x16_8x32x1_2x4_4x8_2x4) { using WarpShape = cutlass::gemm::GemmShape<8, 32, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -866,9 +866,9 @@ TEST(SM50_device_maximum_minimum_dsrgemm_nt_n, 32x32x8_16x8x1_2x2_8x4_2x4) { using WarpShape = cutlass::gemm::GemmShape<16, 8, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -902,9 +902,9 @@ TEST(SM50_device_maximum_minimum_dsrgemm_nt_n, 32x64x8_16x16x1_4x2_4x8_2x4) { using WarpShape = cutlass::gemm::GemmShape<16, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -938,9 +938,9 @@ TEST(SM50_device_maximum_minimum_dsrgemm_nt_n, 32x128x8_16x32x1_4x4_4x8_2x4) { using WarpShape = 
cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -974,9 +974,9 @@ TEST(SM50_device_maximum_minimum_dsrgemm_nt_n, 64x64x8_32x16x1_4x4_8x4_2x4) { using WarpShape = cutlass::gemm::GemmShape<32, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1010,9 +1010,9 @@ TEST(SM50_device_maximum_minimum_dsrgemm_nt_n, 32x32x8_8x16x1_2x2_4x8_4x2) { using WarpShape = cutlass::gemm::GemmShape<8, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1046,9 +1046,9 @@ TEST(SM50_device_maximum_minimum_dsrgemm_nt_n, 64x32x8_16x16x1_4x2_4x8_4x2) { using WarpShape = cutlass::gemm::GemmShape<16, 16, 8>; using InstructionShape = 
cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1082,9 +1082,9 @@ TEST(SM50_device_maximum_minimum_dsrgemm_nt_n, 64x64x8_16x32x1_4x4_4x8_4x2) { using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1118,9 +1118,9 @@ TEST(SM50_device_maximum_minimum_dsrgemm_nt_n, 128x32x8_32x16x1_4x4_8x4_4x2) { using WarpShape = cutlass::gemm::GemmShape<32, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1154,9 +1154,9 @@ TEST(SM50_device_maximum_minimum_dsrgemm_nt_n, 32x64x16_8x16x1_2x2_4x8_4x4) { using WarpShape = cutlass::gemm::GemmShape<8, 16, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename 
cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1190,9 +1190,9 @@ TEST(SM50_device_maximum_minimum_dsrgemm_nt_n, 32x128x16_8x32x1_2x4_4x8_4x4) { using WarpShape = cutlass::gemm::GemmShape<8, 32, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1226,9 +1226,9 @@ TEST(SM50_device_maximum_minimum_dsrgemm_nt_n, 64x32x16_16x8x1_2x2_8x4_4x4) { using WarpShape = cutlass::gemm::GemmShape<16, 8, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1262,9 +1262,9 @@ TEST(SM50_device_maximum_minimum_dsrgemm_nt_n, 64x64x8_16x16x1_4x2_4x8_4x4) { using WarpShape = cutlass::gemm::GemmShape<16, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - 
precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1298,9 +1298,9 @@ TEST(SM50_device_maximum_minimum_dsrgemm_nt_n, 128x32x16_32x8x1_4x2_8x4_4x4) { using WarpShape = cutlass::gemm::GemmShape<32, 8, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; diff --git a/test/device/sm50_simt_maximum_minimum_dsrgemm_nt_t.cu b/test/device/sm50_simt_maximum_minimum_dsrgemm_nt_t.cu index 5f41aaf..f0dd63e 100644 --- a/test/device/sm50_simt_maximum_minimum_dsrgemm_nt_t.cu +++ b/test/device/sm50_simt_maximum_minimum_dsrgemm_nt_t.cu @@ -38,9 +38,9 @@ TEST(SM50_device_maximum_minimum_dsrgemm_nt_t, 8x32x8_8x32x1_2x4_4x8_1x1) { using WarpShape = cutlass::gemm::GemmShape<8, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -74,9 +74,9 @@ TEST(SM50_device_maximum_minimum_dsrgemm_nt_t, 
16x32x8_16x32x1_4x4_4x8_1x1) { using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -110,9 +110,9 @@ TEST(SM50_device_maximum_minimum_dsrgemm_nt_t, 16x64x8_16x64x1_4x8_4x8_1x1) { using WarpShape = cutlass::gemm::GemmShape<16, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -146,9 +146,9 @@ TEST(SM50_device_maximum_minimum_dsrgemm_nt_t, 32x32x8_32x32x1_8x4_4x8_1x1) { using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -182,9 +182,9 @@ TEST(SM50_device_maximum_minimum_dsrgemm_nt_t, 8x32x8_8x16x1_2x2_4x8_1x2) { using WarpShape = 
cutlass::gemm::GemmShape<8, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -218,9 +218,9 @@ TEST(SM50_device_maximum_minimum_dsrgemm_nt_t, 8x64x8_8x32x1_2x4_4x8_1x2) { using WarpShape = cutlass::gemm::GemmShape<8, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -254,9 +254,9 @@ TEST(SM50_device_maximum_minimum_dsrgemm_nt_t, 16x32x8_16x16x1_4x2_4x8_1x2) { using WarpShape = cutlass::gemm::GemmShape<16, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -290,9 +290,9 @@ TEST(SM50_device_maximum_minimum_dsrgemm_nt_t, 16x64x8_16x32x1_4x4_4x8_1x2) { using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = 
cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -326,9 +326,9 @@ TEST(SM50_device_maximum_minimum_dsrgemm_nt_t, 16x128x8_16x64x1_4x8_4x8_1x2) { using WarpShape = cutlass::gemm::GemmShape<16, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -362,9 +362,9 @@ TEST(SM50_device_maximum_minimum_dsrgemm_nt_t, 32x32x8_32x16x1_4x4_8x4_1x2) { using WarpShape = cutlass::gemm::GemmShape<32, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -398,9 +398,9 @@ TEST(SM50_device_maximum_minimum_dsrgemm_nt_t, 32x64x8_32x32x1_8x4_4x8_1x2) { using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename 
cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -434,9 +434,9 @@ TEST(SM50_device_maximum_minimum_dsrgemm_nt_t, 32x32x8_16x32x1_4x4_4x8_2x1) { using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -470,9 +470,9 @@ TEST(SM50_device_maximum_minimum_dsrgemm_nt_t, 64x32x8_32x32x1_8x4_4x8_2x1) { using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -506,9 +506,9 @@ TEST(SM50_device_maximum_minimum_dsrgemm_nt_t, 16x32x8_8x16x1_2x2_4x8_2x2) { using WarpShape = cutlass::gemm::GemmShape<8, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, 
precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -542,9 +542,9 @@ TEST(SM50_device_maximum_minimum_dsrgemm_nt_t, 16x64x8_8x32x1_2x4_4x8_2x2) { using WarpShape = cutlass::gemm::GemmShape<8, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -578,9 +578,9 @@ TEST(SM50_device_maximum_minimum_dsrgemm_nt_t, 32x32x8_16x16x1_4x2_4x8_2x2) { using WarpShape = cutlass::gemm::GemmShape<16, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -614,9 +614,9 @@ TEST(SM50_device_maximum_minimum_dsrgemm_nt_t, 32x64x8_16x32x1_4x4_4x8_2x2) { using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, 
cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -650,9 +650,9 @@ TEST(SM50_device_maximum_minimum_dsrgemm_nt_t, 32x128x8_16x64x1_4x8_4x8_2x2) { using WarpShape = cutlass::gemm::GemmShape<16, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -686,9 +686,9 @@ TEST(SM50_device_maximum_minimum_dsrgemm_nt_t, 64x32x8_32x16x1_4x4_8x4_2x2) { using WarpShape = cutlass::gemm::GemmShape<32, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -722,9 +722,9 @@ TEST(SM50_device_maximum_minimum_dsrgemm_nt_t, 64x64x8_32x32x1_8x4_4x8_2x2) { using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename 
cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -758,9 +758,9 @@ TEST(SM50_device_maximum_minimum_dsrgemm_nt_t, 128x32x8_64x16x1_8x4_8x4_2x2) { using WarpShape = cutlass::gemm::GemmShape<64, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -794,9 +794,9 @@ TEST(SM50_device_maximum_minimum_dsrgemm_nt_t, 16x64x16_8x16x1_2x2_4x8_2x4) { using WarpShape = cutlass::gemm::GemmShape<8, 16, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -830,9 +830,9 @@ TEST(SM50_device_maximum_minimum_dsrgemm_nt_t, 16x128x16_8x32x1_2x4_4x8_2x4) { using WarpShape = cutlass::gemm::GemmShape<8, 32, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, 
precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -866,9 +866,9 @@ TEST(SM50_device_maximum_minimum_dsrgemm_nt_t, 32x32x8_16x8x1_2x2_8x4_2x4) { using WarpShape = cutlass::gemm::GemmShape<16, 8, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -902,9 +902,9 @@ TEST(SM50_device_maximum_minimum_dsrgemm_nt_t, 32x64x8_16x16x1_4x2_4x8_2x4) { using WarpShape = cutlass::gemm::GemmShape<16, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -938,9 +938,9 @@ TEST(SM50_device_maximum_minimum_dsrgemm_nt_t, 32x128x8_16x32x1_4x4_4x8_2x4) { using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, 
OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -974,9 +974,9 @@ TEST(SM50_device_maximum_minimum_dsrgemm_nt_t, 64x64x8_32x16x1_4x4_8x4_2x4) { using WarpShape = cutlass::gemm::GemmShape<32, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1010,9 +1010,9 @@ TEST(SM50_device_maximum_minimum_dsrgemm_nt_t, 32x32x8_8x16x1_2x2_4x8_4x2) { using WarpShape = cutlass::gemm::GemmShape<8, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1046,9 +1046,9 @@ TEST(SM50_device_maximum_minimum_dsrgemm_nt_t, 64x32x8_16x16x1_4x2_4x8_4x2) { using WarpShape = cutlass::gemm::GemmShape<16, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp 
= Config::MultiplicationOp; @@ -1082,9 +1082,9 @@ TEST(SM50_device_maximum_minimum_dsrgemm_nt_t, 64x64x8_16x32x1_4x4_4x8_4x2) { using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1118,9 +1118,9 @@ TEST(SM50_device_maximum_minimum_dsrgemm_nt_t, 128x32x8_32x16x1_4x4_8x4_4x2) { using WarpShape = cutlass::gemm::GemmShape<32, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1154,9 +1154,9 @@ TEST(SM50_device_maximum_minimum_dsrgemm_nt_t, 32x64x16_8x16x1_2x2_4x8_4x4) { using WarpShape = cutlass::gemm::GemmShape<8, 16, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1190,9 +1190,9 @@ 
TEST(SM50_device_maximum_minimum_dsrgemm_nt_t, 32x128x16_8x32x1_2x4_4x8_4x4) { using WarpShape = cutlass::gemm::GemmShape<8, 32, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1226,9 +1226,9 @@ TEST(SM50_device_maximum_minimum_dsrgemm_nt_t, 64x32x16_16x8x1_2x2_8x4_4x4) { using WarpShape = cutlass::gemm::GemmShape<16, 8, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1262,9 +1262,9 @@ TEST(SM50_device_maximum_minimum_dsrgemm_nt_t, 64x64x8_16x16x1_4x2_4x8_4x4) { using WarpShape = cutlass::gemm::GemmShape<16, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1298,9 +1298,9 @@ TEST(SM50_device_maximum_minimum_dsrgemm_nt_t, 
128x32x16_32x8x1_4x2_8x4_4x4) { using WarpShape = cutlass::gemm::GemmShape<32, 8, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; diff --git a/test/device/sm50_simt_maximum_minimum_dsrgemm_tn_n.cu b/test/device/sm50_simt_maximum_minimum_dsrgemm_tn_n.cu index 391db03..f44fe18 100644 --- a/test/device/sm50_simt_maximum_minimum_dsrgemm_tn_n.cu +++ b/test/device/sm50_simt_maximum_minimum_dsrgemm_tn_n.cu @@ -38,9 +38,9 @@ TEST(SM50_device_maximum_minimum_dsrgemm_tn_n, 8x32x8_8x32x1_2x4_4x8_1x1) { using WarpShape = cutlass::gemm::GemmShape<8, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -74,9 +74,9 @@ TEST(SM50_device_maximum_minimum_dsrgemm_tn_n, 16x32x8_16x32x1_4x4_4x8_1x1) { using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, 
precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -110,9 +110,9 @@ TEST(SM50_device_maximum_minimum_dsrgemm_tn_n, 16x64x8_16x64x1_4x8_4x8_1x1) { using WarpShape = cutlass::gemm::GemmShape<16, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -146,9 +146,9 @@ TEST(SM50_device_maximum_minimum_dsrgemm_tn_n, 32x32x8_32x32x1_8x4_4x8_1x1) { using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -182,9 +182,9 @@ TEST(SM50_device_maximum_minimum_dsrgemm_tn_n, 8x32x8_8x16x1_2x2_4x8_1x2) { using WarpShape = cutlass::gemm::GemmShape<8, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using 
AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -218,9 +218,9 @@ TEST(SM50_device_maximum_minimum_dsrgemm_tn_n, 8x64x8_8x32x1_2x4_4x8_1x2) { using WarpShape = cutlass::gemm::GemmShape<8, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -254,9 +254,9 @@ TEST(SM50_device_maximum_minimum_dsrgemm_tn_n, 16x32x8_16x16x1_4x2_4x8_1x2) { using WarpShape = cutlass::gemm::GemmShape<16, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -290,9 +290,9 @@ TEST(SM50_device_maximum_minimum_dsrgemm_tn_n, 16x64x8_16x32x1_4x4_4x8_1x2) { using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; 
@@ -326,9 +326,9 @@ TEST(SM50_device_maximum_minimum_dsrgemm_tn_n, 16x128x8_16x64x1_4x8_4x8_1x2) { using WarpShape = cutlass::gemm::GemmShape<16, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -362,9 +362,9 @@ TEST(SM50_device_maximum_minimum_dsrgemm_tn_n, 32x32x8_32x16x1_4x4_8x4_1x2) { using WarpShape = cutlass::gemm::GemmShape<32, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -398,9 +398,9 @@ TEST(SM50_device_maximum_minimum_dsrgemm_tn_n, 32x64x8_32x32x1_8x4_4x8_1x2) { using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -434,9 +434,9 @@ TEST(SM50_device_maximum_minimum_dsrgemm_tn_n, 
32x32x8_16x32x1_4x4_4x8_2x1) { using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -470,9 +470,9 @@ TEST(SM50_device_maximum_minimum_dsrgemm_tn_n, 64x32x8_32x32x1_8x4_4x8_2x1) { using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -506,9 +506,9 @@ TEST(SM50_device_maximum_minimum_dsrgemm_tn_n, 16x32x8_8x16x1_2x2_4x8_2x2) { using WarpShape = cutlass::gemm::GemmShape<8, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -542,9 +542,9 @@ TEST(SM50_device_maximum_minimum_dsrgemm_tn_n, 16x64x8_8x32x1_2x4_4x8_2x2) { using WarpShape = 
cutlass::gemm::GemmShape<8, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -578,9 +578,9 @@ TEST(SM50_device_maximum_minimum_dsrgemm_tn_n, 32x32x8_16x16x1_4x2_4x8_2x2) { using WarpShape = cutlass::gemm::GemmShape<16, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -614,9 +614,9 @@ TEST(SM50_device_maximum_minimum_dsrgemm_tn_n, 32x64x8_16x32x1_4x4_4x8_2x2) { using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -650,9 +650,9 @@ TEST(SM50_device_maximum_minimum_dsrgemm_tn_n, 32x128x8_16x64x1_4x8_4x8_2x2) { using WarpShape = cutlass::gemm::GemmShape<16, 64, 8>; using InstructionShape = 
cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -686,9 +686,9 @@ TEST(SM50_device_maximum_minimum_dsrgemm_tn_n, 64x32x8_32x16x1_4x4_8x4_2x2) { using WarpShape = cutlass::gemm::GemmShape<32, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -722,9 +722,9 @@ TEST(SM50_device_maximum_minimum_dsrgemm_tn_n, 64x64x8_32x32x1_8x4_4x8_2x2) { using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -758,9 +758,9 @@ TEST(SM50_device_maximum_minimum_dsrgemm_tn_n, 128x32x8_64x16x1_8x4_8x4_2x2) { using WarpShape = cutlass::gemm::GemmShape<64, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename 
cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -794,9 +794,9 @@ TEST(SM50_device_maximum_minimum_dsrgemm_tn_n, 16x64x16_8x16x1_2x2_4x8_2x4) { using WarpShape = cutlass::gemm::GemmShape<8, 16, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -830,9 +830,9 @@ TEST(SM50_device_maximum_minimum_dsrgemm_tn_n, 16x128x16_8x32x1_2x4_4x8_2x4) { using WarpShape = cutlass::gemm::GemmShape<8, 32, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -866,9 +866,9 @@ TEST(SM50_device_maximum_minimum_dsrgemm_tn_n, 32x32x8_16x8x1_2x2_8x4_2x4) { using WarpShape = cutlass::gemm::GemmShape<16, 8, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, 
precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -902,9 +902,9 @@ TEST(SM50_device_maximum_minimum_dsrgemm_tn_n, 32x64x8_16x16x1_4x2_4x8_2x4) { using WarpShape = cutlass::gemm::GemmShape<16, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -938,9 +938,9 @@ TEST(SM50_device_maximum_minimum_dsrgemm_tn_n, 32x128x8_16x32x1_4x4_4x8_2x4) { using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -974,9 +974,9 @@ TEST(SM50_device_maximum_minimum_dsrgemm_tn_n, 64x64x8_32x16x1_4x4_8x4_2x4) { using WarpShape = cutlass::gemm::GemmShape<32, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, 
cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1010,9 +1010,9 @@ TEST(SM50_device_maximum_minimum_dsrgemm_tn_n, 32x32x8_8x16x1_2x2_4x8_4x2) { using WarpShape = cutlass::gemm::GemmShape<8, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1046,9 +1046,9 @@ TEST(SM50_device_maximum_minimum_dsrgemm_tn_n, 64x32x8_16x16x1_4x2_4x8_4x2) { using WarpShape = cutlass::gemm::GemmShape<16, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1082,9 +1082,9 @@ TEST(SM50_device_maximum_minimum_dsrgemm_tn_n, 64x64x8_16x32x1_4x4_4x8_4x2) { using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename 
cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1118,9 +1118,9 @@ TEST(SM50_device_maximum_minimum_dsrgemm_tn_n, 128x32x8_32x16x1_4x4_8x4_4x2) { using WarpShape = cutlass::gemm::GemmShape<32, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1154,9 +1154,9 @@ TEST(SM50_device_maximum_minimum_dsrgemm_tn_n, 32x64x16_8x16x1_2x2_4x8_4x4) { using WarpShape = cutlass::gemm::GemmShape<8, 16, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1190,9 +1190,9 @@ TEST(SM50_device_maximum_minimum_dsrgemm_tn_n, 32x128x16_8x32x1_2x4_4x8_4x4) { using WarpShape = cutlass::gemm::GemmShape<8, 32, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + 
precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1226,9 +1226,9 @@ TEST(SM50_device_maximum_minimum_dsrgemm_tn_n, 64x32x16_16x8x1_2x2_8x4_4x4) { using WarpShape = cutlass::gemm::GemmShape<16, 8, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1262,9 +1262,9 @@ TEST(SM50_device_maximum_minimum_dsrgemm_tn_n, 64x64x8_16x16x1_4x2_4x8_4x4) { using WarpShape = cutlass::gemm::GemmShape<16, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1298,9 +1298,9 @@ TEST(SM50_device_maximum_minimum_dsrgemm_tn_n, 128x32x16_32x8x1_4x2_8x4_4x4) { using WarpShape = cutlass::gemm::GemmShape<32, 8, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + 
cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; diff --git a/test/device/sm50_simt_maximum_minimum_dsrgemm_tn_t.cu b/test/device/sm50_simt_maximum_minimum_dsrgemm_tn_t.cu index 59a437b..ac70846 100644 --- a/test/device/sm50_simt_maximum_minimum_dsrgemm_tn_t.cu +++ b/test/device/sm50_simt_maximum_minimum_dsrgemm_tn_t.cu @@ -38,9 +38,9 @@ TEST(SM50_device_maximum_minimum_dsrgemm_tn_t, 8x32x8_8x32x1_2x4_4x8_1x1) { using WarpShape = cutlass::gemm::GemmShape<8, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -74,9 +74,9 @@ TEST(SM50_device_maximum_minimum_dsrgemm_tn_t, 16x32x8_16x32x1_4x4_4x8_1x1) { using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -110,9 +110,9 @@ TEST(SM50_device_maximum_minimum_dsrgemm_tn_t, 16x64x8_16x64x1_4x8_4x8_1x1) { using WarpShape = cutlass::gemm::GemmShape<16, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, 
precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -146,9 +146,9 @@ TEST(SM50_device_maximum_minimum_dsrgemm_tn_t, 32x32x8_32x32x1_8x4_4x8_1x1) { using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -182,9 +182,9 @@ TEST(SM50_device_maximum_minimum_dsrgemm_tn_t, 8x32x8_8x16x1_2x2_4x8_1x2) { using WarpShape = cutlass::gemm::GemmShape<8, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -218,9 +218,9 @@ TEST(SM50_device_maximum_minimum_dsrgemm_tn_t, 8x64x8_8x32x1_2x4_4x8_1x2) { using WarpShape = cutlass::gemm::GemmShape<8, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, 
SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -254,9 +254,9 @@ TEST(SM50_device_maximum_minimum_dsrgemm_tn_t, 16x32x8_16x16x1_4x2_4x8_1x2) { using WarpShape = cutlass::gemm::GemmShape<16, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -290,9 +290,9 @@ TEST(SM50_device_maximum_minimum_dsrgemm_tn_t, 16x64x8_16x32x1_4x4_4x8_1x2) { using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -326,9 +326,9 @@ TEST(SM50_device_maximum_minimum_dsrgemm_tn_t, 16x128x8_16x64x1_4x8_4x8_1x2) { using WarpShape = cutlass::gemm::GemmShape<16, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename 
cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -362,9 +362,9 @@ TEST(SM50_device_maximum_minimum_dsrgemm_tn_t, 32x32x8_32x16x1_4x4_8x4_1x2) { using WarpShape = cutlass::gemm::GemmShape<32, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -398,9 +398,9 @@ TEST(SM50_device_maximum_minimum_dsrgemm_tn_t, 32x64x8_32x32x1_8x4_4x8_1x2) { using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -434,9 +434,9 @@ TEST(SM50_device_maximum_minimum_dsrgemm_tn_t, 32x32x8_16x32x1_4x4_4x8_2x1) { using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, 
precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -470,9 +470,9 @@ TEST(SM50_device_maximum_minimum_dsrgemm_tn_t, 64x32x8_32x32x1_8x4_4x8_2x1) { using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -506,9 +506,9 @@ TEST(SM50_device_maximum_minimum_dsrgemm_tn_t, 16x32x8_8x16x1_2x2_4x8_2x2) { using WarpShape = cutlass::gemm::GemmShape<8, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -542,9 +542,9 @@ TEST(SM50_device_maximum_minimum_dsrgemm_tn_t, 16x64x8_8x32x1_2x4_4x8_2x2) { using WarpShape = cutlass::gemm::GemmShape<8, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, 
OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -578,9 +578,9 @@ TEST(SM50_device_maximum_minimum_dsrgemm_tn_t, 32x32x8_16x16x1_4x2_4x8_2x2) { using WarpShape = cutlass::gemm::GemmShape<16, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -614,9 +614,9 @@ TEST(SM50_device_maximum_minimum_dsrgemm_tn_t, 32x64x8_16x32x1_4x4_4x8_2x2) { using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -650,9 +650,9 @@ TEST(SM50_device_maximum_minimum_dsrgemm_tn_t, 32x128x8_16x64x1_4x8_4x8_2x2) { using WarpShape = cutlass::gemm::GemmShape<16, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = 
Config::MultiplicationOp; @@ -686,9 +686,9 @@ TEST(SM50_device_maximum_minimum_dsrgemm_tn_t, 64x32x8_32x16x1_4x4_8x4_2x2) { using WarpShape = cutlass::gemm::GemmShape<32, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -722,9 +722,9 @@ TEST(SM50_device_maximum_minimum_dsrgemm_tn_t, 64x64x8_32x32x1_8x4_4x8_2x2) { using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -758,9 +758,9 @@ TEST(SM50_device_maximum_minimum_dsrgemm_tn_t, 128x32x8_64x16x1_8x4_8x4_2x2) { using WarpShape = cutlass::gemm::GemmShape<64, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -794,9 +794,9 @@ 
TEST(SM50_device_maximum_minimum_dsrgemm_tn_t, 16x64x16_8x16x1_2x2_4x8_2x4) { using WarpShape = cutlass::gemm::GemmShape<8, 16, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -830,9 +830,9 @@ TEST(SM50_device_maximum_minimum_dsrgemm_tn_t, 16x128x16_8x32x1_2x4_4x8_2x4) { using WarpShape = cutlass::gemm::GemmShape<8, 32, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -866,9 +866,9 @@ TEST(SM50_device_maximum_minimum_dsrgemm_tn_t, 32x32x8_16x8x1_2x2_8x4_2x4) { using WarpShape = cutlass::gemm::GemmShape<16, 8, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -902,9 +902,9 @@ TEST(SM50_device_maximum_minimum_dsrgemm_tn_t, 
32x64x8_16x16x1_4x2_4x8_2x4) { using WarpShape = cutlass::gemm::GemmShape<16, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -938,9 +938,9 @@ TEST(SM50_device_maximum_minimum_dsrgemm_tn_t, 32x128x8_16x32x1_4x4_4x8_2x4) { using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -974,9 +974,9 @@ TEST(SM50_device_maximum_minimum_dsrgemm_tn_t, 64x64x8_32x16x1_4x4_8x4_2x4) { using WarpShape = cutlass::gemm::GemmShape<32, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1010,9 +1010,9 @@ TEST(SM50_device_maximum_minimum_dsrgemm_tn_t, 32x32x8_8x16x1_2x2_4x8_4x2) { using WarpShape = 
cutlass::gemm::GemmShape<8, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1046,9 +1046,9 @@ TEST(SM50_device_maximum_minimum_dsrgemm_tn_t, 64x32x8_16x16x1_4x2_4x8_4x2) { using WarpShape = cutlass::gemm::GemmShape<16, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1082,9 +1082,9 @@ TEST(SM50_device_maximum_minimum_dsrgemm_tn_t, 64x64x8_16x32x1_4x4_4x8_4x2) { using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1118,9 +1118,9 @@ TEST(SM50_device_maximum_minimum_dsrgemm_tn_t, 128x32x8_32x16x1_4x4_8x4_4x2) { using WarpShape = cutlass::gemm::GemmShape<32, 16, 8>; using InstructionShape = 
cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1154,9 +1154,9 @@ TEST(SM50_device_maximum_minimum_dsrgemm_tn_t, 32x64x16_8x16x1_2x2_4x8_4x4) { using WarpShape = cutlass::gemm::GemmShape<8, 16, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1190,9 +1190,9 @@ TEST(SM50_device_maximum_minimum_dsrgemm_tn_t, 32x128x16_8x32x1_2x4_4x8_4x4) { using WarpShape = cutlass::gemm::GemmShape<8, 32, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1226,9 +1226,9 @@ TEST(SM50_device_maximum_minimum_dsrgemm_tn_t, 64x32x16_16x8x1_2x2_8x4_4x4) { using WarpShape = cutlass::gemm::GemmShape<16, 8, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename 
cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1262,9 +1262,9 @@ TEST(SM50_device_maximum_minimum_dsrgemm_tn_t, 64x64x8_16x16x1_4x2_4x8_4x4) { using WarpShape = cutlass::gemm::GemmShape<16, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1298,9 +1298,9 @@ TEST(SM50_device_maximum_minimum_dsrgemm_tn_t, 128x32x16_32x8x1_4x2_8x4_4x4) { using WarpShape = cutlass::gemm::GemmShape<32, 8, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; diff --git a/test/device/sm50_simt_maximum_minimum_dsrgemm_tt_n.cu b/test/device/sm50_simt_maximum_minimum_dsrgemm_tt_n.cu index 194615c..126a7d8 100644 --- a/test/device/sm50_simt_maximum_minimum_dsrgemm_tt_n.cu +++ b/test/device/sm50_simt_maximum_minimum_dsrgemm_tt_n.cu @@ -38,9 +38,9 @@ 
TEST(SM50_device_maximum_minimum_dsrgemm_tt_n, 8x32x8_8x32x1_2x4_4x8_1x1) { using WarpShape = cutlass::gemm::GemmShape<8, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -74,9 +74,9 @@ TEST(SM50_device_maximum_minimum_dsrgemm_tt_n, 16x32x8_16x32x1_4x4_4x8_1x1) { using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -110,9 +110,9 @@ TEST(SM50_device_maximum_minimum_dsrgemm_tt_n, 16x64x8_16x64x1_4x8_4x8_1x1) { using WarpShape = cutlass::gemm::GemmShape<16, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -146,9 +146,9 @@ TEST(SM50_device_maximum_minimum_dsrgemm_tt_n, 
32x32x8_32x32x1_8x4_4x8_1x1) { using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -182,9 +182,9 @@ TEST(SM50_device_maximum_minimum_dsrgemm_tt_n, 8x32x8_8x16x1_2x2_4x8_1x2) { using WarpShape = cutlass::gemm::GemmShape<8, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -218,9 +218,9 @@ TEST(SM50_device_maximum_minimum_dsrgemm_tt_n, 8x64x8_8x32x1_2x4_4x8_1x2) { using WarpShape = cutlass::gemm::GemmShape<8, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -254,9 +254,9 @@ TEST(SM50_device_maximum_minimum_dsrgemm_tt_n, 16x32x8_16x16x1_4x2_4x8_1x2) { using WarpShape = 
cutlass::gemm::GemmShape<16, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -290,9 +290,9 @@ TEST(SM50_device_maximum_minimum_dsrgemm_tt_n, 16x64x8_16x32x1_4x4_4x8_1x2) { using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -326,9 +326,9 @@ TEST(SM50_device_maximum_minimum_dsrgemm_tt_n, 16x128x8_16x64x1_4x8_4x8_1x2) { using WarpShape = cutlass::gemm::GemmShape<16, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -362,9 +362,9 @@ TEST(SM50_device_maximum_minimum_dsrgemm_tt_n, 32x32x8_32x16x1_4x4_8x4_1x2) { using WarpShape = cutlass::gemm::GemmShape<32, 16, 8>; using InstructionShape = 
cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -398,9 +398,9 @@ TEST(SM50_device_maximum_minimum_dsrgemm_tt_n, 32x64x8_32x32x1_8x4_4x8_1x2) { using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -434,9 +434,9 @@ TEST(SM50_device_maximum_minimum_dsrgemm_tt_n, 32x32x8_16x32x1_4x4_4x8_2x1) { using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -470,9 +470,9 @@ TEST(SM50_device_maximum_minimum_dsrgemm_tt_n, 64x32x8_32x32x1_8x4_4x8_2x1) { using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename 
cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -506,9 +506,9 @@ TEST(SM50_device_maximum_minimum_dsrgemm_tt_n, 16x32x8_8x16x1_2x2_4x8_2x2) { using WarpShape = cutlass::gemm::GemmShape<8, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -542,9 +542,9 @@ TEST(SM50_device_maximum_minimum_dsrgemm_tt_n, 16x64x8_8x32x1_2x4_4x8_2x2) { using WarpShape = cutlass::gemm::GemmShape<8, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -578,9 +578,9 @@ TEST(SM50_device_maximum_minimum_dsrgemm_tt_n, 32x32x8_16x16x1_4x2_4x8_2x2) { using WarpShape = cutlass::gemm::GemmShape<16, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, 
precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -614,9 +614,9 @@ TEST(SM50_device_maximum_minimum_dsrgemm_tt_n, 32x64x8_16x32x1_4x4_4x8_2x2) { using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -650,9 +650,9 @@ TEST(SM50_device_maximum_minimum_dsrgemm_tt_n, 32x128x8_16x64x1_4x8_4x8_2x2) { using WarpShape = cutlass::gemm::GemmShape<16, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -686,9 +686,9 @@ TEST(SM50_device_maximum_minimum_dsrgemm_tt_n, 64x32x8_32x16x1_4x4_8x4_2x2) { using WarpShape = cutlass::gemm::GemmShape<32, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, 
cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -722,9 +722,9 @@ TEST(SM50_device_maximum_minimum_dsrgemm_tt_n, 64x64x8_32x32x1_8x4_4x8_2x2) { using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -758,9 +758,9 @@ TEST(SM50_device_maximum_minimum_dsrgemm_tt_n, 128x32x8_64x16x1_8x4_8x4_2x2) { using WarpShape = cutlass::gemm::GemmShape<64, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -794,9 +794,9 @@ TEST(SM50_device_maximum_minimum_dsrgemm_tt_n, 16x64x16_8x16x1_2x2_4x8_2x4) { using WarpShape = cutlass::gemm::GemmShape<8, 16, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename 
cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -830,9 +830,9 @@ TEST(SM50_device_maximum_minimum_dsrgemm_tt_n, 16x128x16_8x32x1_2x4_4x8_2x4) { using WarpShape = cutlass::gemm::GemmShape<8, 32, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -866,9 +866,9 @@ TEST(SM50_device_maximum_minimum_dsrgemm_tt_n, 32x32x8_16x8x1_2x2_8x4_2x4) { using WarpShape = cutlass::gemm::GemmShape<16, 8, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -902,9 +902,9 @@ TEST(SM50_device_maximum_minimum_dsrgemm_tt_n, 32x64x8_16x16x1_4x2_4x8_2x4) { using WarpShape = cutlass::gemm::GemmShape<16, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, 
precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -938,9 +938,9 @@ TEST(SM50_device_maximum_minimum_dsrgemm_tt_n, 32x128x8_16x32x1_4x4_4x8_2x4) { using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -974,9 +974,9 @@ TEST(SM50_device_maximum_minimum_dsrgemm_tt_n, 64x64x8_32x16x1_4x4_8x4_2x4) { using WarpShape = cutlass::gemm::GemmShape<32, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1010,9 +1010,9 @@ TEST(SM50_device_maximum_minimum_dsrgemm_tt_n, 32x32x8_8x16x1_2x2_4x8_4x2) { using WarpShape = cutlass::gemm::GemmShape<8, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, 
OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1046,9 +1046,9 @@ TEST(SM50_device_maximum_minimum_dsrgemm_tt_n, 64x32x8_16x16x1_4x2_4x8_4x2) { using WarpShape = cutlass::gemm::GemmShape<16, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1082,9 +1082,9 @@ TEST(SM50_device_maximum_minimum_dsrgemm_tt_n, 64x64x8_16x32x1_4x4_4x8_4x2) { using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1118,9 +1118,9 @@ TEST(SM50_device_maximum_minimum_dsrgemm_tt_n, 128x32x8_32x16x1_4x4_8x4_4x2) { using WarpShape = cutlass::gemm::GemmShape<32, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using 
MultOp = Config::MultiplicationOp; @@ -1154,9 +1154,9 @@ TEST(SM50_device_maximum_minimum_dsrgemm_tt_n, 32x64x16_8x16x1_2x2_4x8_4x4) { using WarpShape = cutlass::gemm::GemmShape<8, 16, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1190,9 +1190,9 @@ TEST(SM50_device_maximum_minimum_dsrgemm_tt_n, 32x128x16_8x32x1_2x4_4x8_4x4) { using WarpShape = cutlass::gemm::GemmShape<8, 32, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1226,9 +1226,9 @@ TEST(SM50_device_maximum_minimum_dsrgemm_tt_n, 64x32x16_16x8x1_2x2_8x4_4x4) { using WarpShape = cutlass::gemm::GemmShape<16, 8, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1262,9 +1262,9 @@ 
TEST(SM50_device_maximum_minimum_dsrgemm_tt_n, 64x64x8_16x16x1_4x2_4x8_4x4) { using WarpShape = cutlass::gemm::GemmShape<16, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1298,9 +1298,9 @@ TEST(SM50_device_maximum_minimum_dsrgemm_tt_n, 128x32x16_32x8x1_4x2_8x4_4x4) { using WarpShape = cutlass::gemm::GemmShape<32, 8, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; diff --git a/test/device/sm50_simt_maximum_minimum_dsrgemm_tt_t.cu b/test/device/sm50_simt_maximum_minimum_dsrgemm_tt_t.cu index 56f8f95..a07485a 100644 --- a/test/device/sm50_simt_maximum_minimum_dsrgemm_tt_t.cu +++ b/test/device/sm50_simt_maximum_minimum_dsrgemm_tt_t.cu @@ -38,9 +38,9 @@ TEST(SM50_device_maximum_minimum_dsrgemm_tt_t, 8x32x8_8x32x1_2x4_4x8_1x1) { using WarpShape = cutlass::gemm::GemmShape<8, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename 
cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -74,9 +74,9 @@ TEST(SM50_device_maximum_minimum_dsrgemm_tt_t, 16x32x8_16x32x1_4x4_4x8_1x1) { using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -110,9 +110,9 @@ TEST(SM50_device_maximum_minimum_dsrgemm_tt_t, 16x64x8_16x64x1_4x8_4x8_1x1) { using WarpShape = cutlass::gemm::GemmShape<16, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -146,9 +146,9 @@ TEST(SM50_device_maximum_minimum_dsrgemm_tt_t, 32x32x8_32x32x1_8x4_4x8_1x1) { using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, 
precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -182,9 +182,9 @@ TEST(SM50_device_maximum_minimum_dsrgemm_tt_t, 8x32x8_8x16x1_2x2_4x8_1x2) { using WarpShape = cutlass::gemm::GemmShape<8, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -218,9 +218,9 @@ TEST(SM50_device_maximum_minimum_dsrgemm_tt_t, 8x64x8_8x32x1_2x4_4x8_1x2) { using WarpShape = cutlass::gemm::GemmShape<8, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -254,9 +254,9 @@ TEST(SM50_device_maximum_minimum_dsrgemm_tt_t, 16x32x8_16x16x1_4x2_4x8_1x2) { using WarpShape = cutlass::gemm::GemmShape<16, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, 
OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -290,9 +290,9 @@ TEST(SM50_device_maximum_minimum_dsrgemm_tt_t, 16x64x8_16x32x1_4x4_4x8_1x2) { using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -326,9 +326,9 @@ TEST(SM50_device_maximum_minimum_dsrgemm_tt_t, 16x128x8_16x64x1_4x8_4x8_1x2) { using WarpShape = cutlass::gemm::GemmShape<16, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -362,9 +362,9 @@ TEST(SM50_device_maximum_minimum_dsrgemm_tt_t, 32x32x8_32x16x1_4x4_8x4_1x2) { using WarpShape = cutlass::gemm::GemmShape<32, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = 
Config::MultiplicationOp; @@ -398,9 +398,9 @@ TEST(SM50_device_maximum_minimum_dsrgemm_tt_t, 32x64x8_32x32x1_8x4_4x8_1x2) { using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -434,9 +434,9 @@ TEST(SM50_device_maximum_minimum_dsrgemm_tt_t, 32x32x8_16x32x1_4x4_4x8_2x1) { using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -470,9 +470,9 @@ TEST(SM50_device_maximum_minimum_dsrgemm_tt_t, 64x32x8_32x32x1_8x4_4x8_2x1) { using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -506,9 +506,9 @@ 
TEST(SM50_device_maximum_minimum_dsrgemm_tt_t, 16x32x8_8x16x1_2x2_4x8_2x2) { using WarpShape = cutlass::gemm::GemmShape<8, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -542,9 +542,9 @@ TEST(SM50_device_maximum_minimum_dsrgemm_tt_t, 16x64x8_8x32x1_2x4_4x8_2x2) { using WarpShape = cutlass::gemm::GemmShape<8, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -578,9 +578,9 @@ TEST(SM50_device_maximum_minimum_dsrgemm_tt_t, 32x32x8_16x16x1_4x2_4x8_2x2) { using WarpShape = cutlass::gemm::GemmShape<16, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -614,9 +614,9 @@ TEST(SM50_device_maximum_minimum_dsrgemm_tt_t, 
32x64x8_16x32x1_4x4_4x8_2x2) { using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -650,9 +650,9 @@ TEST(SM50_device_maximum_minimum_dsrgemm_tt_t, 32x128x8_16x64x1_4x8_4x8_2x2) { using WarpShape = cutlass::gemm::GemmShape<16, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -686,9 +686,9 @@ TEST(SM50_device_maximum_minimum_dsrgemm_tt_t, 64x32x8_32x16x1_4x4_8x4_2x2) { using WarpShape = cutlass::gemm::GemmShape<32, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -722,9 +722,9 @@ TEST(SM50_device_maximum_minimum_dsrgemm_tt_t, 64x64x8_32x32x1_8x4_4x8_2x2) { using WarpShape = 
cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -758,9 +758,9 @@ TEST(SM50_device_maximum_minimum_dsrgemm_tt_t, 128x32x8_64x16x1_8x4_8x4_2x2) { using WarpShape = cutlass::gemm::GemmShape<64, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -794,9 +794,9 @@ TEST(SM50_device_maximum_minimum_dsrgemm_tt_t, 16x64x16_8x16x1_2x2_4x8_2x4) { using WarpShape = cutlass::gemm::GemmShape<8, 16, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -830,9 +830,9 @@ TEST(SM50_device_maximum_minimum_dsrgemm_tt_t, 16x128x16_8x32x1_2x4_4x8_2x4) { using WarpShape = cutlass::gemm::GemmShape<8, 32, 16>; using InstructionShape = 
cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -866,9 +866,9 @@ TEST(SM50_device_maximum_minimum_dsrgemm_tt_t, 32x32x8_16x8x1_2x2_8x4_2x4) { using WarpShape = cutlass::gemm::GemmShape<16, 8, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -902,9 +902,9 @@ TEST(SM50_device_maximum_minimum_dsrgemm_tt_t, 32x64x8_16x16x1_4x2_4x8_2x4) { using WarpShape = cutlass::gemm::GemmShape<16, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -938,9 +938,9 @@ TEST(SM50_device_maximum_minimum_dsrgemm_tt_t, 32x128x8_16x32x1_4x4_4x8_2x4) { using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename 
cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -974,9 +974,9 @@ TEST(SM50_device_maximum_minimum_dsrgemm_tt_t, 64x64x8_32x16x1_4x4_8x4_2x4) { using WarpShape = cutlass::gemm::GemmShape<32, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1010,9 +1010,9 @@ TEST(SM50_device_maximum_minimum_dsrgemm_tt_t, 32x32x8_8x16x1_2x2_4x8_4x2) { using WarpShape = cutlass::gemm::GemmShape<8, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1046,9 +1046,9 @@ TEST(SM50_device_maximum_minimum_dsrgemm_tt_t, 64x32x8_16x16x1_4x2_4x8_4x2) { using WarpShape = cutlass::gemm::GemmShape<16, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - 
precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1082,9 +1082,9 @@ TEST(SM50_device_maximum_minimum_dsrgemm_tt_t, 64x64x8_16x32x1_4x4_4x8_4x2) { using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1118,9 +1118,9 @@ TEST(SM50_device_maximum_minimum_dsrgemm_tt_t, 128x32x8_32x16x1_4x4_8x4_4x2) { using WarpShape = cutlass::gemm::GemmShape<32, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1154,9 +1154,9 @@ TEST(SM50_device_maximum_minimum_dsrgemm_tt_t, 32x64x16_8x16x1_2x2_4x8_4x4) { using WarpShape = cutlass::gemm::GemmShape<8, 16, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - 
cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1190,9 +1190,9 @@ TEST(SM50_device_maximum_minimum_dsrgemm_tt_t, 32x128x16_8x32x1_2x4_4x8_4x4) { using WarpShape = cutlass::gemm::GemmShape<8, 32, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1226,9 +1226,9 @@ TEST(SM50_device_maximum_minimum_dsrgemm_tt_t, 64x32x16_16x8x1_2x2_8x4_4x4) { using WarpShape = cutlass::gemm::GemmShape<16, 8, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1262,9 +1262,9 @@ TEST(SM50_device_maximum_minimum_dsrgemm_tt_t, 64x64x8_16x16x1_4x2_4x8_4x4) { using WarpShape = cutlass::gemm::GemmShape<16, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = 
typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1298,9 +1298,9 @@ TEST(SM50_device_maximum_minimum_dsrgemm_tt_t, 128x32x16_32x8x1_4x2_8x4_4x4) { using WarpShape = cutlass::gemm::GemmShape<32, 8, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; diff --git a/test/device/sm50_simt_maximum_minimum_ssrgemm_nn_n.cu b/test/device/sm50_simt_maximum_minimum_ssrgemm_nn_n.cu index 0dbd857..cac2b9e 100644 --- a/test/device/sm50_simt_maximum_minimum_ssrgemm_nn_n.cu +++ b/test/device/sm50_simt_maximum_minimum_ssrgemm_nn_n.cu @@ -38,9 +38,9 @@ TEST(SM50_device_maximum_minimum_ssrgemm_nn_n, 8x32x8_8x32x1_2x4_4x8_1x1) { using WarpShape = cutlass::gemm::GemmShape<8, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -74,9 +74,9 @@ TEST(SM50_device_maximum_minimum_ssrgemm_nn_n, 16x32x8_16x32x1_4x4_4x8_1x1) { using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 
1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -110,9 +110,9 @@ TEST(SM50_device_maximum_minimum_ssrgemm_nn_n, 16x64x8_16x64x1_4x8_4x8_1x1) { using WarpShape = cutlass::gemm::GemmShape<16, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -146,9 +146,9 @@ TEST(SM50_device_maximum_minimum_ssrgemm_nn_n, 32x32x8_32x32x1_8x4_4x8_1x1) { using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -182,9 +182,9 @@ TEST(SM50_device_maximum_minimum_ssrgemm_nn_n, 32x64x8_32x64x1_8x8_4x8_1x1) { using WarpShape = cutlass::gemm::GemmShape<32, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename 
cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -218,9 +218,9 @@ TEST(SM50_device_maximum_minimum_ssrgemm_nn_n, 64x32x8_64x32x1_8x8_8x4_1x1) { using WarpShape = cutlass::gemm::GemmShape<64, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -254,9 +254,9 @@ TEST(SM50_device_maximum_minimum_ssrgemm_nn_n, 8x32x8_8x16x1_2x2_4x8_1x2) { using WarpShape = cutlass::gemm::GemmShape<8, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -290,9 +290,9 @@ TEST(SM50_device_maximum_minimum_ssrgemm_nn_n, 8x64x8_8x32x1_2x4_4x8_1x2) { using WarpShape = cutlass::gemm::GemmShape<8, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, 
precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -326,9 +326,9 @@ TEST(SM50_device_maximum_minimum_ssrgemm_nn_n, 16x32x8_16x16x1_4x2_4x8_1x2) { using WarpShape = cutlass::gemm::GemmShape<16, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -362,9 +362,9 @@ TEST(SM50_device_maximum_minimum_ssrgemm_nn_n, 16x64x8_16x32x1_4x4_4x8_1x2) { using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -398,9 +398,9 @@ TEST(SM50_device_maximum_minimum_ssrgemm_nn_n, 16x128x8_16x64x1_4x8_4x8_1x2) { using WarpShape = cutlass::gemm::GemmShape<16, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, 
cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -434,9 +434,9 @@ TEST(SM50_device_maximum_minimum_ssrgemm_nn_n, 32x32x8_32x16x1_4x4_8x4_1x2) { using WarpShape = cutlass::gemm::GemmShape<32, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -470,9 +470,9 @@ TEST(SM50_device_maximum_minimum_ssrgemm_nn_n, 32x64x8_32x32x1_8x4_4x8_1x2) { using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -506,9 +506,9 @@ TEST(SM50_device_maximum_minimum_ssrgemm_nn_n, 32x128x8_32x64x1_8x8_4x8_1x2) { using WarpShape = cutlass::gemm::GemmShape<32, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename 
cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -542,9 +542,9 @@ TEST(SM50_device_maximum_minimum_ssrgemm_nn_n, 64x64x8_64x32x1_8x8_8x4_1x2) { using WarpShape = cutlass::gemm::GemmShape<64, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -578,9 +578,9 @@ TEST(SM50_device_maximum_minimum_ssrgemm_nn_n, 32x32x8_16x32x1_4x4_4x8_2x1) { using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -614,9 +614,9 @@ TEST(SM50_device_maximum_minimum_ssrgemm_nn_n, 64x32x8_32x32x1_8x4_4x8_2x1) { using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, 
precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -650,9 +650,9 @@ TEST(SM50_device_maximum_minimum_ssrgemm_nn_n, 64x64x8_32x64x1_8x8_4x8_2x1) { using WarpShape = cutlass::gemm::GemmShape<32, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -686,9 +686,9 @@ TEST(SM50_device_maximum_minimum_ssrgemm_nn_n, 128x32x8_64x32x1_8x8_8x4_2x1) { using WarpShape = cutlass::gemm::GemmShape<64, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -722,9 +722,9 @@ TEST(SM50_device_maximum_minimum_ssrgemm_nn_n, 16x32x8_8x16x1_2x2_4x8_2x2) { using WarpShape = cutlass::gemm::GemmShape<8, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, 
OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -758,9 +758,9 @@ TEST(SM50_device_maximum_minimum_ssrgemm_nn_n, 16x64x8_8x32x1_2x4_4x8_2x2) { using WarpShape = cutlass::gemm::GemmShape<8, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -794,9 +794,9 @@ TEST(SM50_device_maximum_minimum_ssrgemm_nn_n, 32x32x8_16x16x1_4x2_4x8_2x2) { using WarpShape = cutlass::gemm::GemmShape<16, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -830,9 +830,9 @@ TEST(SM50_device_maximum_minimum_ssrgemm_nn_n, 32x64x8_16x32x1_4x4_4x8_2x2) { using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = 
Config::MultiplicationOp; @@ -866,9 +866,9 @@ TEST(SM50_device_maximum_minimum_ssrgemm_nn_n, 32x128x8_16x64x1_4x8_4x8_2x2) { using WarpShape = cutlass::gemm::GemmShape<16, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -902,9 +902,9 @@ TEST(SM50_device_maximum_minimum_ssrgemm_nn_n, 64x32x8_32x16x1_4x4_8x4_2x2) { using WarpShape = cutlass::gemm::GemmShape<32, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -938,9 +938,9 @@ TEST(SM50_device_maximum_minimum_ssrgemm_nn_n, 64x64x8_32x32x1_8x4_4x8_2x2) { using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -974,9 +974,9 @@ 
TEST(SM50_device_maximum_minimum_ssrgemm_nn_n, 64x128x8_32x64x1_8x8_4x8_2x2) { using WarpShape = cutlass::gemm::GemmShape<32, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1010,9 +1010,9 @@ TEST(SM50_device_maximum_minimum_ssrgemm_nn_n, 128x32x8_64x16x1_8x4_8x4_2x2) { using WarpShape = cutlass::gemm::GemmShape<64, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1046,9 +1046,9 @@ TEST(SM50_device_maximum_minimum_ssrgemm_nn_n, 128x64x8_64x32x1_8x8_8x4_2x2) { using WarpShape = cutlass::gemm::GemmShape<64, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1082,9 +1082,9 @@ TEST(SM50_device_maximum_minimum_ssrgemm_nn_n, 
16x64x16_8x16x1_2x2_4x8_2x4) { using WarpShape = cutlass::gemm::GemmShape<8, 16, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1118,9 +1118,9 @@ TEST(SM50_device_maximum_minimum_ssrgemm_nn_n, 16x128x16_8x32x1_2x4_4x8_2x4) { using WarpShape = cutlass::gemm::GemmShape<8, 32, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1154,9 +1154,9 @@ TEST(SM50_device_maximum_minimum_ssrgemm_nn_n, 32x32x8_16x8x1_2x2_8x4_2x4) { using WarpShape = cutlass::gemm::GemmShape<16, 8, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1190,9 +1190,9 @@ TEST(SM50_device_maximum_minimum_ssrgemm_nn_n, 32x64x8_16x16x1_4x2_4x8_2x4) { using WarpShape = 
cutlass::gemm::GemmShape<16, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1226,9 +1226,9 @@ TEST(SM50_device_maximum_minimum_ssrgemm_nn_n, 32x128x8_16x32x1_4x4_4x8_2x4) { using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1262,9 +1262,9 @@ TEST(SM50_device_maximum_minimum_ssrgemm_nn_n, 32x256x8_16x64x1_4x8_4x8_2x4) { using WarpShape = cutlass::gemm::GemmShape<16, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1298,9 +1298,9 @@ TEST(SM50_device_maximum_minimum_ssrgemm_nn_n, 64x64x8_32x16x1_4x4_8x4_2x4) { using WarpShape = cutlass::gemm::GemmShape<32, 16, 8>; using InstructionShape 
= cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1334,9 +1334,9 @@ TEST(SM50_device_maximum_minimum_ssrgemm_nn_n, 64x128x8_32x32x1_8x4_4x8_2x4) { using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1370,9 +1370,9 @@ TEST(SM50_device_maximum_minimum_ssrgemm_nn_n, 64x256x8_32x64x1_8x8_4x8_2x4) { using WarpShape = cutlass::gemm::GemmShape<32, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1406,9 +1406,9 @@ TEST(SM50_device_maximum_minimum_ssrgemm_nn_n, 128x128x8_64x32x1_8x8_8x4_2x4) { using WarpShape = cutlass::gemm::GemmShape<64, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = 
typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1442,9 +1442,9 @@ TEST(SM50_device_maximum_minimum_ssrgemm_nn_n, 32x32x8_8x16x1_2x2_4x8_4x2) { using WarpShape = cutlass::gemm::GemmShape<8, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1478,9 +1478,9 @@ TEST(SM50_device_maximum_minimum_ssrgemm_nn_n, 64x32x8_16x16x1_4x2_4x8_4x2) { using WarpShape = cutlass::gemm::GemmShape<16, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1514,9 +1514,9 @@ TEST(SM50_device_maximum_minimum_ssrgemm_nn_n, 64x64x8_16x32x1_4x4_4x8_4x2) { using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // 
- precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1550,9 +1550,9 @@ TEST(SM50_device_maximum_minimum_ssrgemm_nn_n, 128x32x8_32x16x1_4x4_8x4_4x2) { using WarpShape = cutlass::gemm::GemmShape<32, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1586,9 +1586,9 @@ TEST(SM50_device_maximum_minimum_ssrgemm_nn_n, 128x64x8_32x32x1_8x4_4x8_4x2) { using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1622,9 +1622,9 @@ TEST(SM50_device_maximum_minimum_ssrgemm_nn_n, 128x128x8_32x64x1_8x8_4x8_4x2) { using WarpShape = cutlass::gemm::GemmShape<32, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // 
- cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1658,9 +1658,9 @@ TEST(SM50_device_maximum_minimum_ssrgemm_nn_n, 256x32x8_64x16x1_8x4_8x4_4x2) { using WarpShape = cutlass::gemm::GemmShape<64, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1694,9 +1694,9 @@ TEST(SM50_device_maximum_minimum_ssrgemm_nn_n, 256x64x8_64x32x1_8x8_8x4_4x2) { using WarpShape = cutlass::gemm::GemmShape<64, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1730,9 +1730,9 @@ TEST(SM50_device_maximum_minimum_ssrgemm_nn_n, 32x64x16_8x16x1_2x2_4x8_4x4) { using WarpShape = cutlass::gemm::GemmShape<8, 16, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = 
typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1766,9 +1766,9 @@ TEST(SM50_device_maximum_minimum_ssrgemm_nn_n, 32x128x16_8x32x1_2x4_4x8_4x4) { using WarpShape = cutlass::gemm::GemmShape<8, 32, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1802,9 +1802,9 @@ TEST(SM50_device_maximum_minimum_ssrgemm_nn_n, 64x32x16_16x8x1_2x2_8x4_4x4) { using WarpShape = cutlass::gemm::GemmShape<16, 8, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1838,9 +1838,9 @@ TEST(SM50_device_maximum_minimum_ssrgemm_nn_n, 64x64x8_16x16x1_4x2_4x8_4x4) { using WarpShape = cutlass::gemm::GemmShape<16, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< 
+ precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1874,9 +1874,9 @@ TEST(SM50_device_maximum_minimum_ssrgemm_nn_n, 64x128x8_16x32x1_4x4_4x8_4x4) { using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1910,9 +1910,9 @@ TEST(SM50_device_maximum_minimum_ssrgemm_nn_n, 64x256x8_16x64x1_4x8_4x8_4x4) { using WarpShape = cutlass::gemm::GemmShape<16, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1946,9 +1946,9 @@ TEST(SM50_device_maximum_minimum_ssrgemm_nn_n, 128x32x16_32x8x1_4x2_8x4_4x4) { using WarpShape = cutlass::gemm::GemmShape<32, 8, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + 
cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1982,9 +1982,9 @@ TEST(SM50_device_maximum_minimum_ssrgemm_nn_n, 128x64x8_32x16x1_4x4_8x4_4x4) { using WarpShape = cutlass::gemm::GemmShape<32, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -2018,9 +2018,9 @@ TEST(SM50_device_maximum_minimum_ssrgemm_nn_n, 128x128x8_32x32x1_8x4_4x8_4x4) { using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -2054,9 +2054,9 @@ TEST(SM50_device_maximum_minimum_ssrgemm_nn_n, 256x64x8_64x16x1_8x4_8x4_4x4) { using WarpShape = cutlass::gemm::GemmShape<64, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using 
AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; diff --git a/test/device/sm50_simt_maximum_minimum_ssrgemm_nn_t.cu b/test/device/sm50_simt_maximum_minimum_ssrgemm_nn_t.cu index 64786fe..46551ea 100644 --- a/test/device/sm50_simt_maximum_minimum_ssrgemm_nn_t.cu +++ b/test/device/sm50_simt_maximum_minimum_ssrgemm_nn_t.cu @@ -38,9 +38,9 @@ TEST(SM50_device_maximum_minimum_ssrgemm_nn_t, 8x32x8_8x32x1_2x4_4x8_1x1) { using WarpShape = cutlass::gemm::GemmShape<8, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -74,9 +74,9 @@ TEST(SM50_device_maximum_minimum_ssrgemm_nn_t, 16x32x8_16x32x1_4x4_4x8_1x1) { using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -110,9 +110,9 @@ TEST(SM50_device_maximum_minimum_ssrgemm_nn_t, 16x64x8_16x64x1_4x8_4x8_1x1) { using WarpShape = cutlass::gemm::GemmShape<16, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, 
cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -146,9 +146,9 @@ TEST(SM50_device_maximum_minimum_ssrgemm_nn_t, 32x32x8_32x32x1_8x4_4x8_1x1) { using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -182,9 +182,9 @@ TEST(SM50_device_maximum_minimum_ssrgemm_nn_t, 32x64x8_32x64x1_8x8_4x8_1x1) { using WarpShape = cutlass::gemm::GemmShape<32, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -218,9 +218,9 @@ TEST(SM50_device_maximum_minimum_ssrgemm_nn_t, 64x32x8_64x32x1_8x8_8x4_1x1) { using WarpShape = cutlass::gemm::GemmShape<64, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename 
cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -254,9 +254,9 @@ TEST(SM50_device_maximum_minimum_ssrgemm_nn_t, 8x32x8_8x16x1_2x2_4x8_1x2) { using WarpShape = cutlass::gemm::GemmShape<8, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -290,9 +290,9 @@ TEST(SM50_device_maximum_minimum_ssrgemm_nn_t, 8x64x8_8x32x1_2x4_4x8_1x2) { using WarpShape = cutlass::gemm::GemmShape<8, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -326,9 +326,9 @@ TEST(SM50_device_maximum_minimum_ssrgemm_nn_t, 16x32x8_16x16x1_4x2_4x8_1x2) { using WarpShape = cutlass::gemm::GemmShape<16, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, 
precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -362,9 +362,9 @@ TEST(SM50_device_maximum_minimum_ssrgemm_nn_t, 16x64x8_16x32x1_4x4_4x8_1x2) { using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -398,9 +398,9 @@ TEST(SM50_device_maximum_minimum_ssrgemm_nn_t, 16x128x8_16x64x1_4x8_4x8_1x2) { using WarpShape = cutlass::gemm::GemmShape<16, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -434,9 +434,9 @@ TEST(SM50_device_maximum_minimum_ssrgemm_nn_t, 32x32x8_32x16x1_4x4_8x4_1x2) { using WarpShape = cutlass::gemm::GemmShape<32, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, 
OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -470,9 +470,9 @@ TEST(SM50_device_maximum_minimum_ssrgemm_nn_t, 32x64x8_32x32x1_8x4_4x8_1x2) { using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -506,9 +506,9 @@ TEST(SM50_device_maximum_minimum_ssrgemm_nn_t, 32x128x8_32x64x1_8x8_4x8_1x2) { using WarpShape = cutlass::gemm::GemmShape<32, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -542,9 +542,9 @@ TEST(SM50_device_maximum_minimum_ssrgemm_nn_t, 64x64x8_64x32x1_8x8_8x4_1x2) { using WarpShape = cutlass::gemm::GemmShape<64, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = 
Config::MultiplicationOp; @@ -578,9 +578,9 @@ TEST(SM50_device_maximum_minimum_ssrgemm_nn_t, 32x32x8_16x32x1_4x4_4x8_2x1) { using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -614,9 +614,9 @@ TEST(SM50_device_maximum_minimum_ssrgemm_nn_t, 64x32x8_32x32x1_8x4_4x8_2x1) { using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -650,9 +650,9 @@ TEST(SM50_device_maximum_minimum_ssrgemm_nn_t, 64x64x8_32x64x1_8x8_4x8_2x1) { using WarpShape = cutlass::gemm::GemmShape<32, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -686,9 +686,9 @@ 
TEST(SM50_device_maximum_minimum_ssrgemm_nn_t, 128x32x8_64x32x1_8x8_8x4_2x1) { using WarpShape = cutlass::gemm::GemmShape<64, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -722,9 +722,9 @@ TEST(SM50_device_maximum_minimum_ssrgemm_nn_t, 16x32x8_8x16x1_2x2_4x8_2x2) { using WarpShape = cutlass::gemm::GemmShape<8, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -758,9 +758,9 @@ TEST(SM50_device_maximum_minimum_ssrgemm_nn_t, 16x64x8_8x32x1_2x4_4x8_2x2) { using WarpShape = cutlass::gemm::GemmShape<8, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -794,9 +794,9 @@ TEST(SM50_device_maximum_minimum_ssrgemm_nn_t, 
32x32x8_16x16x1_4x2_4x8_2x2) { using WarpShape = cutlass::gemm::GemmShape<16, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -830,9 +830,9 @@ TEST(SM50_device_maximum_minimum_ssrgemm_nn_t, 32x64x8_16x32x1_4x4_4x8_2x2) { using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -866,9 +866,9 @@ TEST(SM50_device_maximum_minimum_ssrgemm_nn_t, 32x128x8_16x64x1_4x8_4x8_2x2) { using WarpShape = cutlass::gemm::GemmShape<16, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -902,9 +902,9 @@ TEST(SM50_device_maximum_minimum_ssrgemm_nn_t, 64x32x8_32x16x1_4x4_8x4_2x2) { using WarpShape = 
cutlass::gemm::GemmShape<32, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -938,9 +938,9 @@ TEST(SM50_device_maximum_minimum_ssrgemm_nn_t, 64x64x8_32x32x1_8x4_4x8_2x2) { using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -974,9 +974,9 @@ TEST(SM50_device_maximum_minimum_ssrgemm_nn_t, 64x128x8_32x64x1_8x8_4x8_2x2) { using WarpShape = cutlass::gemm::GemmShape<32, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1010,9 +1010,9 @@ TEST(SM50_device_maximum_minimum_ssrgemm_nn_t, 128x32x8_64x16x1_8x4_8x4_2x2) { using WarpShape = cutlass::gemm::GemmShape<64, 16, 8>; using InstructionShape = 
cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1046,9 +1046,9 @@ TEST(SM50_device_maximum_minimum_ssrgemm_nn_t, 128x64x8_64x32x1_8x8_8x4_2x2) { using WarpShape = cutlass::gemm::GemmShape<64, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1082,9 +1082,9 @@ TEST(SM50_device_maximum_minimum_ssrgemm_nn_t, 16x64x16_8x16x1_2x2_4x8_2x4) { using WarpShape = cutlass::gemm::GemmShape<8, 16, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1118,9 +1118,9 @@ TEST(SM50_device_maximum_minimum_ssrgemm_nn_t, 16x128x16_8x32x1_2x4_4x8_2x4) { using WarpShape = cutlass::gemm::GemmShape<8, 32, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = 
typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1154,9 +1154,9 @@ TEST(SM50_device_maximum_minimum_ssrgemm_nn_t, 32x32x8_16x8x1_2x2_8x4_2x4) { using WarpShape = cutlass::gemm::GemmShape<16, 8, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1190,9 +1190,9 @@ TEST(SM50_device_maximum_minimum_ssrgemm_nn_t, 32x64x8_16x16x1_4x2_4x8_2x4) { using WarpShape = cutlass::gemm::GemmShape<16, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1226,9 +1226,9 @@ TEST(SM50_device_maximum_minimum_ssrgemm_nn_t, 32x128x8_16x32x1_4x4_4x8_2x4) { using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // 
- precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1262,9 +1262,9 @@ TEST(SM50_device_maximum_minimum_ssrgemm_nn_t, 32x256x8_16x64x1_4x8_4x8_2x4) { using WarpShape = cutlass::gemm::GemmShape<16, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1298,9 +1298,9 @@ TEST(SM50_device_maximum_minimum_ssrgemm_nn_t, 64x64x8_32x16x1_4x4_8x4_2x4) { using WarpShape = cutlass::gemm::GemmShape<32, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1334,9 +1334,9 @@ TEST(SM50_device_maximum_minimum_ssrgemm_nn_t, 64x128x8_32x32x1_8x4_4x8_2x4) { using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - 
cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1370,9 +1370,9 @@ TEST(SM50_device_maximum_minimum_ssrgemm_nn_t, 64x256x8_32x64x1_8x8_4x8_2x4) { using WarpShape = cutlass::gemm::GemmShape<32, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1406,9 +1406,9 @@ TEST(SM50_device_maximum_minimum_ssrgemm_nn_t, 128x128x8_64x32x1_8x8_8x4_2x4) { using WarpShape = cutlass::gemm::GemmShape<64, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1442,9 +1442,9 @@ TEST(SM50_device_maximum_minimum_ssrgemm_nn_t, 32x32x8_8x16x1_2x2_4x8_4x2) { using WarpShape = cutlass::gemm::GemmShape<8, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = 
typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1478,9 +1478,9 @@ TEST(SM50_device_maximum_minimum_ssrgemm_nn_t, 64x32x8_16x16x1_4x2_4x8_4x2) { using WarpShape = cutlass::gemm::GemmShape<16, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1514,9 +1514,9 @@ TEST(SM50_device_maximum_minimum_ssrgemm_nn_t, 64x64x8_16x32x1_4x4_4x8_4x2) { using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1550,9 +1550,9 @@ TEST(SM50_device_maximum_minimum_ssrgemm_nn_t, 128x32x8_32x16x1_4x4_8x4_4x2) { using WarpShape = cutlass::gemm::GemmShape<32, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< 
+ precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1586,9 +1586,9 @@ TEST(SM50_device_maximum_minimum_ssrgemm_nn_t, 128x64x8_32x32x1_8x4_4x8_4x2) { using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1622,9 +1622,9 @@ TEST(SM50_device_maximum_minimum_ssrgemm_nn_t, 128x128x8_32x64x1_8x8_4x8_4x2) { using WarpShape = cutlass::gemm::GemmShape<32, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1658,9 +1658,9 @@ TEST(SM50_device_maximum_minimum_ssrgemm_nn_t, 256x32x8_64x16x1_8x4_8x4_4x2) { using WarpShape = cutlass::gemm::GemmShape<64, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + 
cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1694,9 +1694,9 @@ TEST(SM50_device_maximum_minimum_ssrgemm_nn_t, 256x64x8_64x32x1_8x8_8x4_4x2) { using WarpShape = cutlass::gemm::GemmShape<64, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1730,9 +1730,9 @@ TEST(SM50_device_maximum_minimum_ssrgemm_nn_t, 32x64x16_8x16x1_2x2_4x8_4x4) { using WarpShape = cutlass::gemm::GemmShape<8, 16, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1766,9 +1766,9 @@ TEST(SM50_device_maximum_minimum_ssrgemm_nn_t, 32x128x16_8x32x1_2x4_4x8_4x4) { using WarpShape = cutlass::gemm::GemmShape<8, 32, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using 
AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1802,9 +1802,9 @@ TEST(SM50_device_maximum_minimum_ssrgemm_nn_t, 64x32x16_16x8x1_2x2_8x4_4x4) { using WarpShape = cutlass::gemm::GemmShape<16, 8, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1838,9 +1838,9 @@ TEST(SM50_device_maximum_minimum_ssrgemm_nn_t, 64x64x8_16x16x1_4x2_4x8_4x4) { using WarpShape = cutlass::gemm::GemmShape<16, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1874,9 +1874,9 @@ TEST(SM50_device_maximum_minimum_ssrgemm_nn_t, 64x128x8_16x32x1_4x4_4x8_4x4) { using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = 
Config::MultiplicationOp; @@ -1910,9 +1910,9 @@ TEST(SM50_device_maximum_minimum_ssrgemm_nn_t, 64x256x8_16x64x1_4x8_4x8_4x4) { using WarpShape = cutlass::gemm::GemmShape<16, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1946,9 +1946,9 @@ TEST(SM50_device_maximum_minimum_ssrgemm_nn_t, 128x32x16_32x8x1_4x2_8x4_4x4) { using WarpShape = cutlass::gemm::GemmShape<32, 8, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1982,9 +1982,9 @@ TEST(SM50_device_maximum_minimum_ssrgemm_nn_t, 128x64x8_32x16x1_4x4_8x4_4x4) { using WarpShape = cutlass::gemm::GemmShape<32, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -2018,9 +2018,9 @@ 
TEST(SM50_device_maximum_minimum_ssrgemm_nn_t, 128x128x8_32x32x1_8x4_4x8_4x4) { using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -2054,9 +2054,9 @@ TEST(SM50_device_maximum_minimum_ssrgemm_nn_t, 256x64x8_64x16x1_8x4_8x4_4x4) { using WarpShape = cutlass::gemm::GemmShape<64, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; diff --git a/test/device/sm50_simt_maximum_minimum_ssrgemm_nt_n.cu b/test/device/sm50_simt_maximum_minimum_ssrgemm_nt_n.cu index 1a983dc..bd78db8 100644 --- a/test/device/sm50_simt_maximum_minimum_ssrgemm_nt_n.cu +++ b/test/device/sm50_simt_maximum_minimum_ssrgemm_nt_n.cu @@ -38,9 +38,9 @@ TEST(SM50_device_maximum_minimum_ssrgemm_nt_n, 8x32x8_8x32x1_2x4_4x8_1x1) { using WarpShape = cutlass::gemm::GemmShape<8, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename 
cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -74,9 +74,9 @@ TEST(SM50_device_maximum_minimum_ssrgemm_nt_n, 16x32x8_16x32x1_4x4_4x8_1x1) { using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -110,9 +110,9 @@ TEST(SM50_device_maximum_minimum_ssrgemm_nt_n, 16x64x8_16x64x1_4x8_4x8_1x1) { using WarpShape = cutlass::gemm::GemmShape<16, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -146,9 +146,9 @@ TEST(SM50_device_maximum_minimum_ssrgemm_nt_n, 32x32x8_32x32x1_8x4_4x8_1x1) { using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, 
precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -182,9 +182,9 @@ TEST(SM50_device_maximum_minimum_ssrgemm_nt_n, 32x64x8_32x64x1_8x8_4x8_1x1) { using WarpShape = cutlass::gemm::GemmShape<32, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -218,9 +218,9 @@ TEST(SM50_device_maximum_minimum_ssrgemm_nt_n, 64x32x8_64x32x1_8x8_8x4_1x1) { using WarpShape = cutlass::gemm::GemmShape<64, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -254,9 +254,9 @@ TEST(SM50_device_maximum_minimum_ssrgemm_nt_n, 8x32x8_8x16x1_2x2_4x8_1x2) { using WarpShape = cutlass::gemm::GemmShape<8, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, 
OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -290,9 +290,9 @@ TEST(SM50_device_maximum_minimum_ssrgemm_nt_n, 8x64x8_8x32x1_2x4_4x8_1x2) { using WarpShape = cutlass::gemm::GemmShape<8, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -326,9 +326,9 @@ TEST(SM50_device_maximum_minimum_ssrgemm_nt_n, 16x32x8_16x16x1_4x2_4x8_1x2) { using WarpShape = cutlass::gemm::GemmShape<16, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -362,9 +362,9 @@ TEST(SM50_device_maximum_minimum_ssrgemm_nt_n, 16x64x8_16x32x1_4x4_4x8_1x2) { using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = 
Config::MultiplicationOp; @@ -398,9 +398,9 @@ TEST(SM50_device_maximum_minimum_ssrgemm_nt_n, 16x128x8_16x64x1_4x8_4x8_1x2) { using WarpShape = cutlass::gemm::GemmShape<16, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -434,9 +434,9 @@ TEST(SM50_device_maximum_minimum_ssrgemm_nt_n, 32x32x8_32x16x1_4x4_8x4_1x2) { using WarpShape = cutlass::gemm::GemmShape<32, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -470,9 +470,9 @@ TEST(SM50_device_maximum_minimum_ssrgemm_nt_n, 32x64x8_32x32x1_8x4_4x8_1x2) { using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -506,9 +506,9 @@ 
TEST(SM50_device_maximum_minimum_ssrgemm_nt_n, 32x128x8_32x64x1_8x8_4x8_1x2) { using WarpShape = cutlass::gemm::GemmShape<32, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -542,9 +542,9 @@ TEST(SM50_device_maximum_minimum_ssrgemm_nt_n, 64x64x8_64x32x1_8x8_8x4_1x2) { using WarpShape = cutlass::gemm::GemmShape<64, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -578,9 +578,9 @@ TEST(SM50_device_maximum_minimum_ssrgemm_nt_n, 32x32x8_16x32x1_4x4_4x8_2x1) { using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -614,9 +614,9 @@ TEST(SM50_device_maximum_minimum_ssrgemm_nt_n, 
64x32x8_32x32x1_8x4_4x8_2x1) { using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -650,9 +650,9 @@ TEST(SM50_device_maximum_minimum_ssrgemm_nt_n, 64x64x8_32x64x1_8x8_4x8_2x1) { using WarpShape = cutlass::gemm::GemmShape<32, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -686,9 +686,9 @@ TEST(SM50_device_maximum_minimum_ssrgemm_nt_n, 128x32x8_64x32x1_8x8_8x4_2x1) { using WarpShape = cutlass::gemm::GemmShape<64, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -722,9 +722,9 @@ TEST(SM50_device_maximum_minimum_ssrgemm_nt_n, 16x32x8_8x16x1_2x2_4x8_2x2) { using WarpShape = 
cutlass::gemm::GemmShape<8, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -758,9 +758,9 @@ TEST(SM50_device_maximum_minimum_ssrgemm_nt_n, 16x64x8_8x32x1_2x4_4x8_2x2) { using WarpShape = cutlass::gemm::GemmShape<8, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -794,9 +794,9 @@ TEST(SM50_device_maximum_minimum_ssrgemm_nt_n, 32x32x8_16x16x1_4x2_4x8_2x2) { using WarpShape = cutlass::gemm::GemmShape<16, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -830,9 +830,9 @@ TEST(SM50_device_maximum_minimum_ssrgemm_nt_n, 32x64x8_16x32x1_4x4_4x8_2x2) { using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = 
cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -866,9 +866,9 @@ TEST(SM50_device_maximum_minimum_ssrgemm_nt_n, 32x128x8_16x64x1_4x8_4x8_2x2) { using WarpShape = cutlass::gemm::GemmShape<16, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -902,9 +902,9 @@ TEST(SM50_device_maximum_minimum_ssrgemm_nt_n, 64x32x8_32x16x1_4x4_8x4_2x2) { using WarpShape = cutlass::gemm::GemmShape<32, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -938,9 +938,9 @@ TEST(SM50_device_maximum_minimum_ssrgemm_nt_n, 64x64x8_32x32x1_8x4_4x8_2x2) { using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename 
cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -974,9 +974,9 @@ TEST(SM50_device_maximum_minimum_ssrgemm_nt_n, 64x128x8_32x64x1_8x8_4x8_2x2) { using WarpShape = cutlass::gemm::GemmShape<32, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1010,9 +1010,9 @@ TEST(SM50_device_maximum_minimum_ssrgemm_nt_n, 128x32x8_64x16x1_8x4_8x4_2x2) { using WarpShape = cutlass::gemm::GemmShape<64, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1046,9 +1046,9 @@ TEST(SM50_device_maximum_minimum_ssrgemm_nt_n, 128x64x8_64x32x1_8x8_8x4_2x2) { using WarpShape = cutlass::gemm::GemmShape<64, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - 
precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1082,9 +1082,9 @@ TEST(SM50_device_maximum_minimum_ssrgemm_nt_n, 16x64x16_8x16x1_2x2_4x8_2x4) { using WarpShape = cutlass::gemm::GemmShape<8, 16, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1118,9 +1118,9 @@ TEST(SM50_device_maximum_minimum_ssrgemm_nt_n, 16x128x16_8x32x1_2x4_4x8_2x4) { using WarpShape = cutlass::gemm::GemmShape<8, 32, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1154,9 +1154,9 @@ TEST(SM50_device_maximum_minimum_ssrgemm_nt_n, 32x32x8_16x8x1_2x2_8x4_2x4) { using WarpShape = cutlass::gemm::GemmShape<16, 8, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - 
cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1190,9 +1190,9 @@ TEST(SM50_device_maximum_minimum_ssrgemm_nt_n, 32x64x8_16x16x1_4x2_4x8_2x4) { using WarpShape = cutlass::gemm::GemmShape<16, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1226,9 +1226,9 @@ TEST(SM50_device_maximum_minimum_ssrgemm_nt_n, 32x128x8_16x32x1_4x4_4x8_2x4) { using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1262,9 +1262,9 @@ TEST(SM50_device_maximum_minimum_ssrgemm_nt_n, 32x256x8_16x64x1_4x8_4x8_2x4) { using WarpShape = cutlass::gemm::GemmShape<16, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = 
typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1298,9 +1298,9 @@ TEST(SM50_device_maximum_minimum_ssrgemm_nt_n, 64x64x8_32x16x1_4x4_8x4_2x4) { using WarpShape = cutlass::gemm::GemmShape<32, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1334,9 +1334,9 @@ TEST(SM50_device_maximum_minimum_ssrgemm_nt_n, 64x128x8_32x32x1_8x4_4x8_2x4) { using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1370,9 +1370,9 @@ TEST(SM50_device_maximum_minimum_ssrgemm_nt_n, 64x256x8_32x64x1_8x8_4x8_2x4) { using WarpShape = cutlass::gemm::GemmShape<32, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< 
+ precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1406,9 +1406,9 @@ TEST(SM50_device_maximum_minimum_ssrgemm_nt_n, 128x128x8_64x32x1_8x8_8x4_2x4) { using WarpShape = cutlass::gemm::GemmShape<64, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1442,9 +1442,9 @@ TEST(SM50_device_maximum_minimum_ssrgemm_nt_n, 32x32x8_8x16x1_2x2_4x8_4x2) { using WarpShape = cutlass::gemm::GemmShape<8, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1478,9 +1478,9 @@ TEST(SM50_device_maximum_minimum_ssrgemm_nt_n, 64x32x8_16x16x1_4x2_4x8_4x2) { using WarpShape = cutlass::gemm::GemmShape<16, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + 
cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1514,9 +1514,9 @@ TEST(SM50_device_maximum_minimum_ssrgemm_nt_n, 64x64x8_16x32x1_4x4_4x8_4x2) { using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1550,9 +1550,9 @@ TEST(SM50_device_maximum_minimum_ssrgemm_nt_n, 128x32x8_32x16x1_4x4_8x4_4x2) { using WarpShape = cutlass::gemm::GemmShape<32, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1586,9 +1586,9 @@ TEST(SM50_device_maximum_minimum_ssrgemm_nt_n, 128x64x8_32x32x1_8x4_4x8_4x2) { using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using 
AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1622,9 +1622,9 @@ TEST(SM50_device_maximum_minimum_ssrgemm_nt_n, 128x128x8_32x64x1_8x8_4x8_4x2) { using WarpShape = cutlass::gemm::GemmShape<32, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1658,9 +1658,9 @@ TEST(SM50_device_maximum_minimum_ssrgemm_nt_n, 256x32x8_64x16x1_8x4_8x4_4x2) { using WarpShape = cutlass::gemm::GemmShape<64, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1694,9 +1694,9 @@ TEST(SM50_device_maximum_minimum_ssrgemm_nt_n, 256x64x8_64x32x1_8x8_8x4_4x2) { using WarpShape = cutlass::gemm::GemmShape<64, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = 
Config::MultiplicationOp; @@ -1730,9 +1730,9 @@ TEST(SM50_device_maximum_minimum_ssrgemm_nt_n, 32x64x16_8x16x1_2x2_4x8_4x4) { using WarpShape = cutlass::gemm::GemmShape<8, 16, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1766,9 +1766,9 @@ TEST(SM50_device_maximum_minimum_ssrgemm_nt_n, 32x128x16_8x32x1_2x4_4x8_4x4) { using WarpShape = cutlass::gemm::GemmShape<8, 32, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1802,9 +1802,9 @@ TEST(SM50_device_maximum_minimum_ssrgemm_nt_n, 64x32x16_16x8x1_2x2_8x4_4x4) { using WarpShape = cutlass::gemm::GemmShape<16, 8, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1838,9 +1838,9 @@ 
TEST(SM50_device_maximum_minimum_ssrgemm_nt_n, 64x64x8_16x16x1_4x2_4x8_4x4) { using WarpShape = cutlass::gemm::GemmShape<16, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1874,9 +1874,9 @@ TEST(SM50_device_maximum_minimum_ssrgemm_nt_n, 64x128x8_16x32x1_4x4_4x8_4x4) { using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1910,9 +1910,9 @@ TEST(SM50_device_maximum_minimum_ssrgemm_nt_n, 64x256x8_16x64x1_4x8_4x8_4x4) { using WarpShape = cutlass::gemm::GemmShape<16, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1946,9 +1946,9 @@ TEST(SM50_device_maximum_minimum_ssrgemm_nt_n, 
128x32x16_32x8x1_4x2_8x4_4x4) { using WarpShape = cutlass::gemm::GemmShape<32, 8, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1982,9 +1982,9 @@ TEST(SM50_device_maximum_minimum_ssrgemm_nt_n, 128x64x8_32x16x1_4x4_8x4_4x4) { using WarpShape = cutlass::gemm::GemmShape<32, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -2018,9 +2018,9 @@ TEST(SM50_device_maximum_minimum_ssrgemm_nt_n, 128x128x8_32x32x1_8x4_4x8_4x4) { using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -2054,9 +2054,9 @@ TEST(SM50_device_maximum_minimum_ssrgemm_nt_n, 256x64x8_64x16x1_8x4_8x4_4x4) { using WarpShape = 
cutlass::gemm::GemmShape<64, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; diff --git a/test/device/sm50_simt_maximum_minimum_ssrgemm_nt_t.cu b/test/device/sm50_simt_maximum_minimum_ssrgemm_nt_t.cu index a4a5981..885b7db 100644 --- a/test/device/sm50_simt_maximum_minimum_ssrgemm_nt_t.cu +++ b/test/device/sm50_simt_maximum_minimum_ssrgemm_nt_t.cu @@ -38,9 +38,9 @@ TEST(SM50_device_maximum_minimum_ssrgemm_nt_t, 8x32x8_8x32x1_2x4_4x8_1x1) { using WarpShape = cutlass::gemm::GemmShape<8, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -74,9 +74,9 @@ TEST(SM50_device_maximum_minimum_ssrgemm_nt_t, 16x32x8_16x32x1_4x4_4x8_1x1) { using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, 
SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -110,9 +110,9 @@ TEST(SM50_device_maximum_minimum_ssrgemm_nt_t, 16x64x8_16x64x1_4x8_4x8_1x1) { using WarpShape = cutlass::gemm::GemmShape<16, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -146,9 +146,9 @@ TEST(SM50_device_maximum_minimum_ssrgemm_nt_t, 32x32x8_32x32x1_8x4_4x8_1x1) { using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -182,9 +182,9 @@ TEST(SM50_device_maximum_minimum_ssrgemm_nt_t, 32x64x8_32x64x1_8x8_4x8_1x1) { using WarpShape = cutlass::gemm::GemmShape<32, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = 
Config::MultiplicationOp; @@ -218,9 +218,9 @@ TEST(SM50_device_maximum_minimum_ssrgemm_nt_t, 64x32x8_64x32x1_8x8_8x4_1x1) { using WarpShape = cutlass::gemm::GemmShape<64, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -254,9 +254,9 @@ TEST(SM50_device_maximum_minimum_ssrgemm_nt_t, 8x32x8_8x16x1_2x2_4x8_1x2) { using WarpShape = cutlass::gemm::GemmShape<8, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -290,9 +290,9 @@ TEST(SM50_device_maximum_minimum_ssrgemm_nt_t, 8x64x8_8x32x1_2x4_4x8_1x2) { using WarpShape = cutlass::gemm::GemmShape<8, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -326,9 +326,9 @@ 
TEST(SM50_device_maximum_minimum_ssrgemm_nt_t, 16x32x8_16x16x1_4x2_4x8_1x2) { using WarpShape = cutlass::gemm::GemmShape<16, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -362,9 +362,9 @@ TEST(SM50_device_maximum_minimum_ssrgemm_nt_t, 16x64x8_16x32x1_4x4_4x8_1x2) { using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -398,9 +398,9 @@ TEST(SM50_device_maximum_minimum_ssrgemm_nt_t, 16x128x8_16x64x1_4x8_4x8_1x2) { using WarpShape = cutlass::gemm::GemmShape<16, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -434,9 +434,9 @@ TEST(SM50_device_maximum_minimum_ssrgemm_nt_t, 
32x32x8_32x16x1_4x4_8x4_1x2) { using WarpShape = cutlass::gemm::GemmShape<32, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -470,9 +470,9 @@ TEST(SM50_device_maximum_minimum_ssrgemm_nt_t, 32x64x8_32x32x1_8x4_4x8_1x2) { using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -506,9 +506,9 @@ TEST(SM50_device_maximum_minimum_ssrgemm_nt_t, 32x128x8_32x64x1_8x8_4x8_1x2) { using WarpShape = cutlass::gemm::GemmShape<32, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -542,9 +542,9 @@ TEST(SM50_device_maximum_minimum_ssrgemm_nt_t, 64x64x8_64x32x1_8x8_8x4_1x2) { using WarpShape = 
cutlass::gemm::GemmShape<64, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -578,9 +578,9 @@ TEST(SM50_device_maximum_minimum_ssrgemm_nt_t, 32x32x8_16x32x1_4x4_4x8_2x1) { using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -614,9 +614,9 @@ TEST(SM50_device_maximum_minimum_ssrgemm_nt_t, 64x32x8_32x32x1_8x4_4x8_2x1) { using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -650,9 +650,9 @@ TEST(SM50_device_maximum_minimum_ssrgemm_nt_t, 64x64x8_32x64x1_8x8_4x8_2x1) { using WarpShape = cutlass::gemm::GemmShape<32, 64, 8>; using InstructionShape = 
cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -686,9 +686,9 @@ TEST(SM50_device_maximum_minimum_ssrgemm_nt_t, 128x32x8_64x32x1_8x8_8x4_2x1) { using WarpShape = cutlass::gemm::GemmShape<64, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -722,9 +722,9 @@ TEST(SM50_device_maximum_minimum_ssrgemm_nt_t, 16x32x8_8x16x1_2x2_4x8_2x2) { using WarpShape = cutlass::gemm::GemmShape<8, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -758,9 +758,9 @@ TEST(SM50_device_maximum_minimum_ssrgemm_nt_t, 16x64x8_8x32x1_2x4_4x8_2x2) { using WarpShape = cutlass::gemm::GemmShape<8, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename 
cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -794,9 +794,9 @@ TEST(SM50_device_maximum_minimum_ssrgemm_nt_t, 32x32x8_16x16x1_4x2_4x8_2x2) { using WarpShape = cutlass::gemm::GemmShape<16, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -830,9 +830,9 @@ TEST(SM50_device_maximum_minimum_ssrgemm_nt_t, 32x64x8_16x32x1_4x4_4x8_2x2) { using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -866,9 +866,9 @@ TEST(SM50_device_maximum_minimum_ssrgemm_nt_t, 32x128x8_16x64x1_4x8_4x8_2x2) { using WarpShape = cutlass::gemm::GemmShape<16, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, 
precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -902,9 +902,9 @@ TEST(SM50_device_maximum_minimum_ssrgemm_nt_t, 64x32x8_32x16x1_4x4_8x4_2x2) { using WarpShape = cutlass::gemm::GemmShape<32, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -938,9 +938,9 @@ TEST(SM50_device_maximum_minimum_ssrgemm_nt_t, 64x64x8_32x32x1_8x4_4x8_2x2) { using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -974,9 +974,9 @@ TEST(SM50_device_maximum_minimum_ssrgemm_nt_t, 64x128x8_32x64x1_8x8_4x8_2x2) { using WarpShape = cutlass::gemm::GemmShape<32, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, 
cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1010,9 +1010,9 @@ TEST(SM50_device_maximum_minimum_ssrgemm_nt_t, 128x32x8_64x16x1_8x4_8x4_2x2) { using WarpShape = cutlass::gemm::GemmShape<64, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1046,9 +1046,9 @@ TEST(SM50_device_maximum_minimum_ssrgemm_nt_t, 128x64x8_64x32x1_8x8_8x4_2x2) { using WarpShape = cutlass::gemm::GemmShape<64, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1082,9 +1082,9 @@ TEST(SM50_device_maximum_minimum_ssrgemm_nt_t, 16x64x16_8x16x1_2x2_4x8_2x4) { using WarpShape = cutlass::gemm::GemmShape<8, 16, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename 
cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1118,9 +1118,9 @@ TEST(SM50_device_maximum_minimum_ssrgemm_nt_t, 16x128x16_8x32x1_2x4_4x8_2x4) { using WarpShape = cutlass::gemm::GemmShape<8, 32, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1154,9 +1154,9 @@ TEST(SM50_device_maximum_minimum_ssrgemm_nt_t, 32x32x8_16x8x1_2x2_8x4_2x4) { using WarpShape = cutlass::gemm::GemmShape<16, 8, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1190,9 +1190,9 @@ TEST(SM50_device_maximum_minimum_ssrgemm_nt_t, 32x64x8_16x16x1_4x2_4x8_2x4) { using WarpShape = cutlass::gemm::GemmShape<16, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + 
precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1226,9 +1226,9 @@ TEST(SM50_device_maximum_minimum_ssrgemm_nt_t, 32x128x8_16x32x1_4x4_4x8_2x4) { using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1262,9 +1262,9 @@ TEST(SM50_device_maximum_minimum_ssrgemm_nt_t, 32x256x8_16x64x1_4x8_4x8_2x4) { using WarpShape = cutlass::gemm::GemmShape<16, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1298,9 +1298,9 @@ TEST(SM50_device_maximum_minimum_ssrgemm_nt_t, 64x64x8_32x16x1_4x4_8x4_2x4) { using WarpShape = cutlass::gemm::GemmShape<32, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + 
cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1334,9 +1334,9 @@ TEST(SM50_device_maximum_minimum_ssrgemm_nt_t, 64x128x8_32x32x1_8x4_4x8_2x4) { using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1370,9 +1370,9 @@ TEST(SM50_device_maximum_minimum_ssrgemm_nt_t, 64x256x8_32x64x1_8x8_4x8_2x4) { using WarpShape = cutlass::gemm::GemmShape<32, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1406,9 +1406,9 @@ TEST(SM50_device_maximum_minimum_ssrgemm_nt_t, 128x128x8_64x32x1_8x8_8x4_2x4) { using WarpShape = cutlass::gemm::GemmShape<64, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using 
AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1442,9 +1442,9 @@ TEST(SM50_device_maximum_minimum_ssrgemm_nt_t, 32x32x8_8x16x1_2x2_4x8_4x2) { using WarpShape = cutlass::gemm::GemmShape<8, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1478,9 +1478,9 @@ TEST(SM50_device_maximum_minimum_ssrgemm_nt_t, 64x32x8_16x16x1_4x2_4x8_4x2) { using WarpShape = cutlass::gemm::GemmShape<16, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1514,9 +1514,9 @@ TEST(SM50_device_maximum_minimum_ssrgemm_nt_t, 64x64x8_16x32x1_4x4_4x8_4x2) { using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = 
Config::MultiplicationOp; @@ -1550,9 +1550,9 @@ TEST(SM50_device_maximum_minimum_ssrgemm_nt_t, 128x32x8_32x16x1_4x4_8x4_4x2) { using WarpShape = cutlass::gemm::GemmShape<32, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1586,9 +1586,9 @@ TEST(SM50_device_maximum_minimum_ssrgemm_nt_t, 128x64x8_32x32x1_8x4_4x8_4x2) { using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1622,9 +1622,9 @@ TEST(SM50_device_maximum_minimum_ssrgemm_nt_t, 128x128x8_32x64x1_8x8_4x8_4x2) { using WarpShape = cutlass::gemm::GemmShape<32, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1658,9 +1658,9 @@ 
TEST(SM50_device_maximum_minimum_ssrgemm_nt_t, 256x32x8_64x16x1_8x4_8x4_4x2) { using WarpShape = cutlass::gemm::GemmShape<64, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1694,9 +1694,9 @@ TEST(SM50_device_maximum_minimum_ssrgemm_nt_t, 256x64x8_64x32x1_8x8_8x4_4x2) { using WarpShape = cutlass::gemm::GemmShape<64, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1730,9 +1730,9 @@ TEST(SM50_device_maximum_minimum_ssrgemm_nt_t, 32x64x16_8x16x1_2x2_4x8_4x4) { using WarpShape = cutlass::gemm::GemmShape<8, 16, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1766,9 +1766,9 @@ TEST(SM50_device_maximum_minimum_ssrgemm_nt_t, 
32x128x16_8x32x1_2x4_4x8_4x4) { using WarpShape = cutlass::gemm::GemmShape<8, 32, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1802,9 +1802,9 @@ TEST(SM50_device_maximum_minimum_ssrgemm_nt_t, 64x32x16_16x8x1_2x2_8x4_4x4) { using WarpShape = cutlass::gemm::GemmShape<16, 8, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1838,9 +1838,9 @@ TEST(SM50_device_maximum_minimum_ssrgemm_nt_t, 64x64x8_16x16x1_4x2_4x8_4x4) { using WarpShape = cutlass::gemm::GemmShape<16, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1874,9 +1874,9 @@ TEST(SM50_device_maximum_minimum_ssrgemm_nt_t, 64x128x8_16x32x1_4x4_4x8_4x4) { using WarpShape = 
cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1910,9 +1910,9 @@ TEST(SM50_device_maximum_minimum_ssrgemm_nt_t, 64x256x8_16x64x1_4x8_4x8_4x4) { using WarpShape = cutlass::gemm::GemmShape<16, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1946,9 +1946,9 @@ TEST(SM50_device_maximum_minimum_ssrgemm_nt_t, 128x32x16_32x8x1_4x2_8x4_4x4) { using WarpShape = cutlass::gemm::GemmShape<32, 8, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1982,9 +1982,9 @@ TEST(SM50_device_maximum_minimum_ssrgemm_nt_t, 128x64x8_32x16x1_4x4_8x4_4x4) { using WarpShape = cutlass::gemm::GemmShape<32, 16, 8>; using 
InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -2018,9 +2018,9 @@ TEST(SM50_device_maximum_minimum_ssrgemm_nt_t, 128x128x8_32x32x1_8x4_4x8_4x4) { using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -2054,9 +2054,9 @@ TEST(SM50_device_maximum_minimum_ssrgemm_nt_t, 256x64x8_64x16x1_8x4_8x4_4x4) { using WarpShape = cutlass::gemm::GemmShape<64, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; diff --git a/test/device/sm50_simt_maximum_minimum_ssrgemm_tn_n.cu b/test/device/sm50_simt_maximum_minimum_ssrgemm_tn_n.cu index 491ced1..dd036be 100644 --- a/test/device/sm50_simt_maximum_minimum_ssrgemm_tn_n.cu +++ 
b/test/device/sm50_simt_maximum_minimum_ssrgemm_tn_n.cu @@ -38,9 +38,9 @@ TEST(SM50_device_maximum_minimum_ssrgemm_tn_n, 8x32x8_8x32x1_2x4_4x8_1x1) { using WarpShape = cutlass::gemm::GemmShape<8, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -74,9 +74,9 @@ TEST(SM50_device_maximum_minimum_ssrgemm_tn_n, 16x32x8_16x32x1_4x4_4x8_1x1) { using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -110,9 +110,9 @@ TEST(SM50_device_maximum_minimum_ssrgemm_tn_n, 16x64x8_16x64x1_4x8_4x8_1x1) { using WarpShape = cutlass::gemm::GemmShape<16, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -146,9 +146,9 
@@ TEST(SM50_device_maximum_minimum_ssrgemm_tn_n, 32x32x8_32x32x1_8x4_4x8_1x1) { using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -182,9 +182,9 @@ TEST(SM50_device_maximum_minimum_ssrgemm_tn_n, 32x64x8_32x64x1_8x8_4x8_1x1) { using WarpShape = cutlass::gemm::GemmShape<32, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -218,9 +218,9 @@ TEST(SM50_device_maximum_minimum_ssrgemm_tn_n, 64x32x8_64x32x1_8x8_8x4_1x1) { using WarpShape = cutlass::gemm::GemmShape<64, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -254,9 +254,9 @@ TEST(SM50_device_maximum_minimum_ssrgemm_tn_n, 
8x32x8_8x16x1_2x2_4x8_1x2) { using WarpShape = cutlass::gemm::GemmShape<8, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -290,9 +290,9 @@ TEST(SM50_device_maximum_minimum_ssrgemm_tn_n, 8x64x8_8x32x1_2x4_4x8_1x2) { using WarpShape = cutlass::gemm::GemmShape<8, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -326,9 +326,9 @@ TEST(SM50_device_maximum_minimum_ssrgemm_tn_n, 16x32x8_16x16x1_4x2_4x8_1x2) { using WarpShape = cutlass::gemm::GemmShape<16, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -362,9 +362,9 @@ TEST(SM50_device_maximum_minimum_ssrgemm_tn_n, 16x64x8_16x32x1_4x4_4x8_1x2) { using WarpShape = 
cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -398,9 +398,9 @@ TEST(SM50_device_maximum_minimum_ssrgemm_tn_n, 16x128x8_16x64x1_4x8_4x8_1x2) { using WarpShape = cutlass::gemm::GemmShape<16, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -434,9 +434,9 @@ TEST(SM50_device_maximum_minimum_ssrgemm_tn_n, 32x32x8_32x16x1_4x4_8x4_1x2) { using WarpShape = cutlass::gemm::GemmShape<32, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -470,9 +470,9 @@ TEST(SM50_device_maximum_minimum_ssrgemm_tn_n, 32x64x8_32x32x1_8x4_4x8_1x2) { using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = 
cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -506,9 +506,9 @@ TEST(SM50_device_maximum_minimum_ssrgemm_tn_n, 32x128x8_32x64x1_8x8_4x8_1x2) { using WarpShape = cutlass::gemm::GemmShape<32, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -542,9 +542,9 @@ TEST(SM50_device_maximum_minimum_ssrgemm_tn_n, 64x64x8_64x32x1_8x8_8x4_1x2) { using WarpShape = cutlass::gemm::GemmShape<64, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -578,9 +578,9 @@ TEST(SM50_device_maximum_minimum_ssrgemm_tn_n, 32x32x8_16x32x1_4x4_4x8_2x1) { using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename 
cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -614,9 +614,9 @@ TEST(SM50_device_maximum_minimum_ssrgemm_tn_n, 64x32x8_32x32x1_8x4_4x8_2x1) { using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -650,9 +650,9 @@ TEST(SM50_device_maximum_minimum_ssrgemm_tn_n, 64x64x8_32x64x1_8x8_4x8_2x1) { using WarpShape = cutlass::gemm::GemmShape<32, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -686,9 +686,9 @@ TEST(SM50_device_maximum_minimum_ssrgemm_tn_n, 128x32x8_64x32x1_8x8_8x4_2x1) { using WarpShape = cutlass::gemm::GemmShape<64, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, 
precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -722,9 +722,9 @@ TEST(SM50_device_maximum_minimum_ssrgemm_tn_n, 16x32x8_8x16x1_2x2_4x8_2x2) { using WarpShape = cutlass::gemm::GemmShape<8, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -758,9 +758,9 @@ TEST(SM50_device_maximum_minimum_ssrgemm_tn_n, 16x64x8_8x32x1_2x4_4x8_2x2) { using WarpShape = cutlass::gemm::GemmShape<8, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -794,9 +794,9 @@ TEST(SM50_device_maximum_minimum_ssrgemm_tn_n, 32x32x8_16x16x1_4x2_4x8_2x2) { using WarpShape = cutlass::gemm::GemmShape<16, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, 
cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -830,9 +830,9 @@ TEST(SM50_device_maximum_minimum_ssrgemm_tn_n, 32x64x8_16x32x1_4x4_4x8_2x2) { using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -866,9 +866,9 @@ TEST(SM50_device_maximum_minimum_ssrgemm_tn_n, 32x128x8_16x64x1_4x8_4x8_2x2) { using WarpShape = cutlass::gemm::GemmShape<16, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -902,9 +902,9 @@ TEST(SM50_device_maximum_minimum_ssrgemm_tn_n, 64x32x8_32x16x1_4x4_8x4_2x2) { using WarpShape = cutlass::gemm::GemmShape<32, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename 
cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -938,9 +938,9 @@ TEST(SM50_device_maximum_minimum_ssrgemm_tn_n, 64x64x8_32x32x1_8x4_4x8_2x2) { using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -974,9 +974,9 @@ TEST(SM50_device_maximum_minimum_ssrgemm_tn_n, 64x128x8_32x64x1_8x8_4x8_2x2) { using WarpShape = cutlass::gemm::GemmShape<32, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1010,9 +1010,9 @@ TEST(SM50_device_maximum_minimum_ssrgemm_tn_n, 128x32x8_64x16x1_8x4_8x4_2x2) { using WarpShape = cutlass::gemm::GemmShape<64, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, 
precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1046,9 +1046,9 @@ TEST(SM50_device_maximum_minimum_ssrgemm_tn_n, 128x64x8_64x32x1_8x8_8x4_2x2) { using WarpShape = cutlass::gemm::GemmShape<64, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1082,9 +1082,9 @@ TEST(SM50_device_maximum_minimum_ssrgemm_tn_n, 16x64x16_8x16x1_2x2_4x8_2x4) { using WarpShape = cutlass::gemm::GemmShape<8, 16, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1118,9 +1118,9 @@ TEST(SM50_device_maximum_minimum_ssrgemm_tn_n, 16x128x16_8x32x1_2x4_4x8_2x4) { using WarpShape = cutlass::gemm::GemmShape<8, 32, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, 
cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1154,9 +1154,9 @@ TEST(SM50_device_maximum_minimum_ssrgemm_tn_n, 32x32x8_16x8x1_2x2_8x4_2x4) { using WarpShape = cutlass::gemm::GemmShape<16, 8, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1190,9 +1190,9 @@ TEST(SM50_device_maximum_minimum_ssrgemm_tn_n, 32x64x8_16x16x1_4x2_4x8_2x4) { using WarpShape = cutlass::gemm::GemmShape<16, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1226,9 +1226,9 @@ TEST(SM50_device_maximum_minimum_ssrgemm_tn_n, 32x128x8_16x32x1_4x4_4x8_2x4) { using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = 
Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1262,9 +1262,9 @@ TEST(SM50_device_maximum_minimum_ssrgemm_tn_n, 32x256x8_16x64x1_4x8_4x8_2x4) { using WarpShape = cutlass::gemm::GemmShape<16, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1298,9 +1298,9 @@ TEST(SM50_device_maximum_minimum_ssrgemm_tn_n, 64x64x8_32x16x1_4x4_8x4_2x4) { using WarpShape = cutlass::gemm::GemmShape<32, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1334,9 +1334,9 @@ TEST(SM50_device_maximum_minimum_ssrgemm_tn_n, 64x128x8_32x32x1_8x4_4x8_2x4) { using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = 
Config::MultiplicationOp; @@ -1370,9 +1370,9 @@ TEST(SM50_device_maximum_minimum_ssrgemm_tn_n, 64x256x8_32x64x1_8x8_4x8_2x4) { using WarpShape = cutlass::gemm::GemmShape<32, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1406,9 +1406,9 @@ TEST(SM50_device_maximum_minimum_ssrgemm_tn_n, 128x128x8_64x32x1_8x8_8x4_2x4) { using WarpShape = cutlass::gemm::GemmShape<64, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1442,9 +1442,9 @@ TEST(SM50_device_maximum_minimum_ssrgemm_tn_n, 32x32x8_8x16x1_2x2_4x8_4x2) { using WarpShape = cutlass::gemm::GemmShape<8, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1478,9 +1478,9 @@ 
TEST(SM50_device_maximum_minimum_ssrgemm_tn_n, 64x32x8_16x16x1_4x2_4x8_4x2) { using WarpShape = cutlass::gemm::GemmShape<16, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1514,9 +1514,9 @@ TEST(SM50_device_maximum_minimum_ssrgemm_tn_n, 64x64x8_16x32x1_4x4_4x8_4x2) { using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1550,9 +1550,9 @@ TEST(SM50_device_maximum_minimum_ssrgemm_tn_n, 128x32x8_32x16x1_4x4_8x4_4x2) { using WarpShape = cutlass::gemm::GemmShape<32, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1586,9 +1586,9 @@ TEST(SM50_device_maximum_minimum_ssrgemm_tn_n, 
128x64x8_32x32x1_8x4_4x8_4x2) { using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1622,9 +1622,9 @@ TEST(SM50_device_maximum_minimum_ssrgemm_tn_n, 128x128x8_32x64x1_8x8_4x8_4x2) { using WarpShape = cutlass::gemm::GemmShape<32, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1658,9 +1658,9 @@ TEST(SM50_device_maximum_minimum_ssrgemm_tn_n, 256x32x8_64x16x1_8x4_8x4_4x2) { using WarpShape = cutlass::gemm::GemmShape<64, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1694,9 +1694,9 @@ TEST(SM50_device_maximum_minimum_ssrgemm_tn_n, 256x64x8_64x32x1_8x8_8x4_4x2) { using WarpShape = 
cutlass::gemm::GemmShape<64, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1730,9 +1730,9 @@ TEST(SM50_device_maximum_minimum_ssrgemm_tn_n, 32x64x16_8x16x1_2x2_4x8_4x4) { using WarpShape = cutlass::gemm::GemmShape<8, 16, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1766,9 +1766,9 @@ TEST(SM50_device_maximum_minimum_ssrgemm_tn_n, 32x128x16_8x32x1_2x4_4x8_4x4) { using WarpShape = cutlass::gemm::GemmShape<8, 32, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1802,9 +1802,9 @@ TEST(SM50_device_maximum_minimum_ssrgemm_tn_n, 64x32x16_16x8x1_2x2_8x4_4x4) { using WarpShape = cutlass::gemm::GemmShape<16, 8, 16>; using InstructionShape 
= cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1838,9 +1838,9 @@ TEST(SM50_device_maximum_minimum_ssrgemm_tn_n, 64x64x8_16x16x1_4x2_4x8_4x4) { using WarpShape = cutlass::gemm::GemmShape<16, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1874,9 +1874,9 @@ TEST(SM50_device_maximum_minimum_ssrgemm_tn_n, 64x128x8_16x32x1_4x4_4x8_4x4) { using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1910,9 +1910,9 @@ TEST(SM50_device_maximum_minimum_ssrgemm_tn_n, 64x256x8_16x64x1_4x8_4x8_4x4) { using WarpShape = cutlass::gemm::GemmShape<16, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = 
typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1946,9 +1946,9 @@ TEST(SM50_device_maximum_minimum_ssrgemm_tn_n, 128x32x16_32x8x1_4x2_8x4_4x4) { using WarpShape = cutlass::gemm::GemmShape<32, 8, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1982,9 +1982,9 @@ TEST(SM50_device_maximum_minimum_ssrgemm_tn_n, 128x64x8_32x16x1_4x4_8x4_4x4) { using WarpShape = cutlass::gemm::GemmShape<32, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -2018,9 +2018,9 @@ TEST(SM50_device_maximum_minimum_ssrgemm_tn_n, 128x128x8_32x32x1_8x4_4x8_4x4) { using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename 
cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -2054,9 +2054,9 @@ TEST(SM50_device_maximum_minimum_ssrgemm_tn_n, 256x64x8_64x16x1_8x4_8x4_4x4) { using WarpShape = cutlass::gemm::GemmShape<64, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; diff --git a/test/device/sm50_simt_maximum_minimum_ssrgemm_tn_t.cu b/test/device/sm50_simt_maximum_minimum_ssrgemm_tn_t.cu index 2ff0802..2e5cdef 100644 --- a/test/device/sm50_simt_maximum_minimum_ssrgemm_tn_t.cu +++ b/test/device/sm50_simt_maximum_minimum_ssrgemm_tn_t.cu @@ -38,9 +38,9 @@ TEST(SM50_device_maximum_minimum_ssrgemm_tn_t, 8x32x8_8x32x1_2x4_4x8_1x1) { using WarpShape = cutlass::gemm::GemmShape<8, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -74,9 +74,9 @@ 
TEST(SM50_device_maximum_minimum_ssrgemm_tn_t, 16x32x8_16x32x1_4x4_4x8_1x1) { using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -110,9 +110,9 @@ TEST(SM50_device_maximum_minimum_ssrgemm_tn_t, 16x64x8_16x64x1_4x8_4x8_1x1) { using WarpShape = cutlass::gemm::GemmShape<16, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -146,9 +146,9 @@ TEST(SM50_device_maximum_minimum_ssrgemm_tn_t, 32x32x8_32x32x1_8x4_4x8_1x1) { using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -182,9 +182,9 @@ TEST(SM50_device_maximum_minimum_ssrgemm_tn_t, 
32x64x8_32x64x1_8x8_4x8_1x1) { using WarpShape = cutlass::gemm::GemmShape<32, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -218,9 +218,9 @@ TEST(SM50_device_maximum_minimum_ssrgemm_tn_t, 64x32x8_64x32x1_8x8_8x4_1x1) { using WarpShape = cutlass::gemm::GemmShape<64, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -254,9 +254,9 @@ TEST(SM50_device_maximum_minimum_ssrgemm_tn_t, 8x32x8_8x16x1_2x2_4x8_1x2) { using WarpShape = cutlass::gemm::GemmShape<8, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -290,9 +290,9 @@ TEST(SM50_device_maximum_minimum_ssrgemm_tn_t, 8x64x8_8x32x1_2x4_4x8_1x2) { using WarpShape = 
cutlass::gemm::GemmShape<8, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -326,9 +326,9 @@ TEST(SM50_device_maximum_minimum_ssrgemm_tn_t, 16x32x8_16x16x1_4x2_4x8_1x2) { using WarpShape = cutlass::gemm::GemmShape<16, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -362,9 +362,9 @@ TEST(SM50_device_maximum_minimum_ssrgemm_tn_t, 16x64x8_16x32x1_4x4_4x8_1x2) { using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -398,9 +398,9 @@ TEST(SM50_device_maximum_minimum_ssrgemm_tn_t, 16x128x8_16x64x1_4x8_4x8_1x2) { using WarpShape = cutlass::gemm::GemmShape<16, 64, 8>; using InstructionShape = 
cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -434,9 +434,9 @@ TEST(SM50_device_maximum_minimum_ssrgemm_tn_t, 32x32x8_32x16x1_4x4_8x4_1x2) { using WarpShape = cutlass::gemm::GemmShape<32, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -470,9 +470,9 @@ TEST(SM50_device_maximum_minimum_ssrgemm_tn_t, 32x64x8_32x32x1_8x4_4x8_1x2) { using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -506,9 +506,9 @@ TEST(SM50_device_maximum_minimum_ssrgemm_tn_t, 32x128x8_32x64x1_8x8_4x8_1x2) { using WarpShape = cutlass::gemm::GemmShape<32, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename 
cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -542,9 +542,9 @@ TEST(SM50_device_maximum_minimum_ssrgemm_tn_t, 64x64x8_64x32x1_8x8_8x4_1x2) { using WarpShape = cutlass::gemm::GemmShape<64, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -578,9 +578,9 @@ TEST(SM50_device_maximum_minimum_ssrgemm_tn_t, 32x32x8_16x32x1_4x4_4x8_2x1) { using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -614,9 +614,9 @@ TEST(SM50_device_maximum_minimum_ssrgemm_tn_t, 64x32x8_32x32x1_8x4_4x8_2x1) { using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, 
precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -650,9 +650,9 @@ TEST(SM50_device_maximum_minimum_ssrgemm_tn_t, 64x64x8_32x64x1_8x8_4x8_2x1) { using WarpShape = cutlass::gemm::GemmShape<32, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -686,9 +686,9 @@ TEST(SM50_device_maximum_minimum_ssrgemm_tn_t, 128x32x8_64x32x1_8x8_8x4_2x1) { using WarpShape = cutlass::gemm::GemmShape<64, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -722,9 +722,9 @@ TEST(SM50_device_maximum_minimum_ssrgemm_tn_t, 16x32x8_8x16x1_2x2_4x8_2x2) { using WarpShape = cutlass::gemm::GemmShape<8, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, 
cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -758,9 +758,9 @@ TEST(SM50_device_maximum_minimum_ssrgemm_tn_t, 16x64x8_8x32x1_2x4_4x8_2x2) { using WarpShape = cutlass::gemm::GemmShape<8, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -794,9 +794,9 @@ TEST(SM50_device_maximum_minimum_ssrgemm_tn_t, 32x32x8_16x16x1_4x2_4x8_2x2) { using WarpShape = cutlass::gemm::GemmShape<16, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -830,9 +830,9 @@ TEST(SM50_device_maximum_minimum_ssrgemm_tn_t, 32x64x8_16x32x1_4x4_4x8_2x2) { using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename 
cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -866,9 +866,9 @@ TEST(SM50_device_maximum_minimum_ssrgemm_tn_t, 32x128x8_16x64x1_4x8_4x8_2x2) { using WarpShape = cutlass::gemm::GemmShape<16, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -902,9 +902,9 @@ TEST(SM50_device_maximum_minimum_ssrgemm_tn_t, 64x32x8_32x16x1_4x4_8x4_2x2) { using WarpShape = cutlass::gemm::GemmShape<32, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -938,9 +938,9 @@ TEST(SM50_device_maximum_minimum_ssrgemm_tn_t, 64x64x8_32x32x1_8x4_4x8_2x2) { using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, 
precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -974,9 +974,9 @@ TEST(SM50_device_maximum_minimum_ssrgemm_tn_t, 64x128x8_32x64x1_8x8_4x8_2x2) { using WarpShape = cutlass::gemm::GemmShape<32, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1010,9 +1010,9 @@ TEST(SM50_device_maximum_minimum_ssrgemm_tn_t, 128x32x8_64x16x1_8x4_8x4_2x2) { using WarpShape = cutlass::gemm::GemmShape<64, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1046,9 +1046,9 @@ TEST(SM50_device_maximum_minimum_ssrgemm_tn_t, 128x64x8_64x32x1_8x8_8x4_2x2) { using WarpShape = cutlass::gemm::GemmShape<64, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, 
cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1082,9 +1082,9 @@ TEST(SM50_device_maximum_minimum_ssrgemm_tn_t, 16x64x16_8x16x1_2x2_4x8_2x4) { using WarpShape = cutlass::gemm::GemmShape<8, 16, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1118,9 +1118,9 @@ TEST(SM50_device_maximum_minimum_ssrgemm_tn_t, 16x128x16_8x32x1_2x4_4x8_2x4) { using WarpShape = cutlass::gemm::GemmShape<8, 32, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1154,9 +1154,9 @@ TEST(SM50_device_maximum_minimum_ssrgemm_tn_t, 32x32x8_16x8x1_2x2_8x4_2x4) { using WarpShape = cutlass::gemm::GemmShape<16, 8, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = 
Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1190,9 +1190,9 @@ TEST(SM50_device_maximum_minimum_ssrgemm_tn_t, 32x64x8_16x16x1_4x2_4x8_2x4) { using WarpShape = cutlass::gemm::GemmShape<16, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1226,9 +1226,9 @@ TEST(SM50_device_maximum_minimum_ssrgemm_tn_t, 32x128x8_16x32x1_4x4_4x8_2x4) { using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1262,9 +1262,9 @@ TEST(SM50_device_maximum_minimum_ssrgemm_tn_t, 32x256x8_16x64x1_4x8_4x8_2x4) { using WarpShape = cutlass::gemm::GemmShape<16, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = 
Config::MultiplicationOp; @@ -1298,9 +1298,9 @@ TEST(SM50_device_maximum_minimum_ssrgemm_tn_t, 64x64x8_32x16x1_4x4_8x4_2x4) { using WarpShape = cutlass::gemm::GemmShape<32, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1334,9 +1334,9 @@ TEST(SM50_device_maximum_minimum_ssrgemm_tn_t, 64x128x8_32x32x1_8x4_4x8_2x4) { using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1370,9 +1370,9 @@ TEST(SM50_device_maximum_minimum_ssrgemm_tn_t, 64x256x8_32x64x1_8x8_4x8_2x4) { using WarpShape = cutlass::gemm::GemmShape<32, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1406,9 +1406,9 @@ 
TEST(SM50_device_maximum_minimum_ssrgemm_tn_t, 128x128x8_64x32x1_8x8_8x4_2x4) { using WarpShape = cutlass::gemm::GemmShape<64, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1442,9 +1442,9 @@ TEST(SM50_device_maximum_minimum_ssrgemm_tn_t, 32x32x8_8x16x1_2x2_4x8_4x2) { using WarpShape = cutlass::gemm::GemmShape<8, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1478,9 +1478,9 @@ TEST(SM50_device_maximum_minimum_ssrgemm_tn_t, 64x32x8_16x16x1_4x2_4x8_4x2) { using WarpShape = cutlass::gemm::GemmShape<16, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1514,9 +1514,9 @@ TEST(SM50_device_maximum_minimum_ssrgemm_tn_t, 
64x64x8_16x32x1_4x4_4x8_4x2) { using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1550,9 +1550,9 @@ TEST(SM50_device_maximum_minimum_ssrgemm_tn_t, 128x32x8_32x16x1_4x4_8x4_4x2) { using WarpShape = cutlass::gemm::GemmShape<32, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1586,9 +1586,9 @@ TEST(SM50_device_maximum_minimum_ssrgemm_tn_t, 128x64x8_32x32x1_8x4_4x8_4x2) { using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1622,9 +1622,9 @@ TEST(SM50_device_maximum_minimum_ssrgemm_tn_t, 128x128x8_32x64x1_8x8_4x8_4x2) { using WarpShape = 
cutlass::gemm::GemmShape<32, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1658,9 +1658,9 @@ TEST(SM50_device_maximum_minimum_ssrgemm_tn_t, 256x32x8_64x16x1_8x4_8x4_4x2) { using WarpShape = cutlass::gemm::GemmShape<64, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1694,9 +1694,9 @@ TEST(SM50_device_maximum_minimum_ssrgemm_tn_t, 256x64x8_64x32x1_8x8_8x4_4x2) { using WarpShape = cutlass::gemm::GemmShape<64, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1730,9 +1730,9 @@ TEST(SM50_device_maximum_minimum_ssrgemm_tn_t, 32x64x16_8x16x1_2x2_4x8_4x4) { using WarpShape = cutlass::gemm::GemmShape<8, 16, 16>; using InstructionShape 
= cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1766,9 +1766,9 @@ TEST(SM50_device_maximum_minimum_ssrgemm_tn_t, 32x128x16_8x32x1_2x4_4x8_4x4) { using WarpShape = cutlass::gemm::GemmShape<8, 32, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1802,9 +1802,9 @@ TEST(SM50_device_maximum_minimum_ssrgemm_tn_t, 64x32x16_16x8x1_2x2_8x4_4x4) { using WarpShape = cutlass::gemm::GemmShape<16, 8, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1838,9 +1838,9 @@ TEST(SM50_device_maximum_minimum_ssrgemm_tn_t, 64x64x8_16x16x1_4x2_4x8_4x4) { using WarpShape = cutlass::gemm::GemmShape<16, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = 
typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1874,9 +1874,9 @@ TEST(SM50_device_maximum_minimum_ssrgemm_tn_t, 64x128x8_16x32x1_4x4_4x8_4x4) { using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1910,9 +1910,9 @@ TEST(SM50_device_maximum_minimum_ssrgemm_tn_t, 64x256x8_16x64x1_4x8_4x8_4x4) { using WarpShape = cutlass::gemm::GemmShape<16, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1946,9 +1946,9 @@ TEST(SM50_device_maximum_minimum_ssrgemm_tn_t, 128x32x16_32x8x1_4x2_8x4_4x4) { using WarpShape = cutlass::gemm::GemmShape<32, 8, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename 
cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1982,9 +1982,9 @@ TEST(SM50_device_maximum_minimum_ssrgemm_tn_t, 128x64x8_32x16x1_4x4_8x4_4x4) { using WarpShape = cutlass::gemm::GemmShape<32, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -2018,9 +2018,9 @@ TEST(SM50_device_maximum_minimum_ssrgemm_tn_t, 128x128x8_32x32x1_8x4_4x8_4x4) { using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -2054,9 +2054,9 @@ TEST(SM50_device_maximum_minimum_ssrgemm_tn_t, 256x64x8_64x16x1_8x4_8x4_4x4) { using WarpShape = cutlass::gemm::GemmShape<64, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - 
precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; diff --git a/test/device/sm50_simt_maximum_minimum_ssrgemm_tt_n.cu b/test/device/sm50_simt_maximum_minimum_ssrgemm_tt_n.cu index 7360a72..d291ac3 100644 --- a/test/device/sm50_simt_maximum_minimum_ssrgemm_tt_n.cu +++ b/test/device/sm50_simt_maximum_minimum_ssrgemm_tt_n.cu @@ -38,9 +38,9 @@ TEST(SM50_device_maximum_minimum_ssrgemm_tt_n, 8x32x8_8x32x1_2x4_4x8_1x1) { using WarpShape = cutlass::gemm::GemmShape<8, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -74,9 +74,9 @@ TEST(SM50_device_maximum_minimum_ssrgemm_tt_n, 16x32x8_16x32x1_4x4_4x8_1x1) { using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -110,9 +110,9 @@ TEST(SM50_device_maximum_minimum_ssrgemm_tt_n, 16x64x8_16x64x1_4x8_4x8_1x1) 
{ using WarpShape = cutlass::gemm::GemmShape<16, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -146,9 +146,9 @@ TEST(SM50_device_maximum_minimum_ssrgemm_tt_n, 32x32x8_32x32x1_8x4_4x8_1x1) { using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -182,9 +182,9 @@ TEST(SM50_device_maximum_minimum_ssrgemm_tt_n, 32x64x8_32x64x1_8x8_4x8_1x1) { using WarpShape = cutlass::gemm::GemmShape<32, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -218,9 +218,9 @@ TEST(SM50_device_maximum_minimum_ssrgemm_tt_n, 64x32x8_64x32x1_8x8_8x4_1x1) { using WarpShape = cutlass::gemm::GemmShape<64, 32, 8>; using 
InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -254,9 +254,9 @@ TEST(SM50_device_maximum_minimum_ssrgemm_tt_n, 8x32x8_8x16x1_2x2_4x8_1x2) { using WarpShape = cutlass::gemm::GemmShape<8, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -290,9 +290,9 @@ TEST(SM50_device_maximum_minimum_ssrgemm_tt_n, 8x64x8_8x32x1_2x4_4x8_1x2) { using WarpShape = cutlass::gemm::GemmShape<8, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -326,9 +326,9 @@ TEST(SM50_device_maximum_minimum_ssrgemm_tt_n, 16x32x8_16x16x1_4x2_4x8_1x2) { using WarpShape = cutlass::gemm::GemmShape<16, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = 
typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -362,9 +362,9 @@ TEST(SM50_device_maximum_minimum_ssrgemm_tt_n, 16x64x8_16x32x1_4x4_4x8_1x2) { using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -398,9 +398,9 @@ TEST(SM50_device_maximum_minimum_ssrgemm_tt_n, 16x128x8_16x64x1_4x8_4x8_1x2) { using WarpShape = cutlass::gemm::GemmShape<16, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -434,9 +434,9 @@ TEST(SM50_device_maximum_minimum_ssrgemm_tt_n, 32x32x8_32x16x1_4x4_8x4_1x2) { using WarpShape = cutlass::gemm::GemmShape<32, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - 
precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -470,9 +470,9 @@ TEST(SM50_device_maximum_minimum_ssrgemm_tt_n, 32x64x8_32x32x1_8x4_4x8_1x2) { using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -506,9 +506,9 @@ TEST(SM50_device_maximum_minimum_ssrgemm_tt_n, 32x128x8_32x64x1_8x8_4x8_1x2) { using WarpShape = cutlass::gemm::GemmShape<32, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -542,9 +542,9 @@ TEST(SM50_device_maximum_minimum_ssrgemm_tt_n, 64x64x8_64x32x1_8x8_8x4_1x2) { using WarpShape = cutlass::gemm::GemmShape<64, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - 
cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -578,9 +578,9 @@ TEST(SM50_device_maximum_minimum_ssrgemm_tt_n, 32x32x8_16x32x1_4x4_4x8_2x1) { using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -614,9 +614,9 @@ TEST(SM50_device_maximum_minimum_ssrgemm_tt_n, 64x32x8_32x32x1_8x4_4x8_2x1) { using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -650,9 +650,9 @@ TEST(SM50_device_maximum_minimum_ssrgemm_tt_n, 64x64x8_32x64x1_8x8_4x8_2x1) { using WarpShape = cutlass::gemm::GemmShape<32, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename 
cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -686,9 +686,9 @@ TEST(SM50_device_maximum_minimum_ssrgemm_tt_n, 128x32x8_64x32x1_8x8_8x4_2x1) { using WarpShape = cutlass::gemm::GemmShape<64, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -722,9 +722,9 @@ TEST(SM50_device_maximum_minimum_ssrgemm_tt_n, 16x32x8_8x16x1_2x2_4x8_2x2) { using WarpShape = cutlass::gemm::GemmShape<8, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -758,9 +758,9 @@ TEST(SM50_device_maximum_minimum_ssrgemm_tt_n, 16x64x8_8x32x1_2x4_4x8_2x2) { using WarpShape = cutlass::gemm::GemmShape<8, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, 
precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -794,9 +794,9 @@ TEST(SM50_device_maximum_minimum_ssrgemm_tt_n, 32x32x8_16x16x1_4x2_4x8_2x2) { using WarpShape = cutlass::gemm::GemmShape<16, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -830,9 +830,9 @@ TEST(SM50_device_maximum_minimum_ssrgemm_tt_n, 32x64x8_16x32x1_4x4_4x8_2x2) { using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -866,9 +866,9 @@ TEST(SM50_device_maximum_minimum_ssrgemm_tt_n, 32x128x8_16x64x1_4x8_4x8_2x2) { using WarpShape = cutlass::gemm::GemmShape<16, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, 
OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -902,9 +902,9 @@ TEST(SM50_device_maximum_minimum_ssrgemm_tt_n, 64x32x8_32x16x1_4x4_8x4_2x2) { using WarpShape = cutlass::gemm::GemmShape<32, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -938,9 +938,9 @@ TEST(SM50_device_maximum_minimum_ssrgemm_tt_n, 64x64x8_32x32x1_8x4_4x8_2x2) { using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -974,9 +974,9 @@ TEST(SM50_device_maximum_minimum_ssrgemm_tt_n, 64x128x8_32x64x1_8x8_4x8_2x2) { using WarpShape = cutlass::gemm::GemmShape<32, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = 
Config::MultiplicationOp; @@ -1010,9 +1010,9 @@ TEST(SM50_device_maximum_minimum_ssrgemm_tt_n, 128x32x8_64x16x1_8x4_8x4_2x2) { using WarpShape = cutlass::gemm::GemmShape<64, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1046,9 +1046,9 @@ TEST(SM50_device_maximum_minimum_ssrgemm_tt_n, 128x64x8_64x32x1_8x8_8x4_2x2) { using WarpShape = cutlass::gemm::GemmShape<64, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1082,9 +1082,9 @@ TEST(SM50_device_maximum_minimum_ssrgemm_tt_n, 16x64x16_8x16x1_2x2_4x8_2x4) { using WarpShape = cutlass::gemm::GemmShape<8, 16, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1118,9 +1118,9 @@ 
TEST(SM50_device_maximum_minimum_ssrgemm_tt_n, 16x128x16_8x32x1_2x4_4x8_2x4) { using WarpShape = cutlass::gemm::GemmShape<8, 32, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1154,9 +1154,9 @@ TEST(SM50_device_maximum_minimum_ssrgemm_tt_n, 32x32x8_16x8x1_2x2_8x4_2x4) { using WarpShape = cutlass::gemm::GemmShape<16, 8, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1190,9 +1190,9 @@ TEST(SM50_device_maximum_minimum_ssrgemm_tt_n, 32x64x8_16x16x1_4x2_4x8_2x4) { using WarpShape = cutlass::gemm::GemmShape<16, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1226,9 +1226,9 @@ TEST(SM50_device_maximum_minimum_ssrgemm_tt_n, 
32x128x8_16x32x1_4x4_4x8_2x4) { using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1262,9 +1262,9 @@ TEST(SM50_device_maximum_minimum_ssrgemm_tt_n, 32x256x8_16x64x1_4x8_4x8_2x4) { using WarpShape = cutlass::gemm::GemmShape<16, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1298,9 +1298,9 @@ TEST(SM50_device_maximum_minimum_ssrgemm_tt_n, 64x64x8_32x16x1_4x4_8x4_2x4) { using WarpShape = cutlass::gemm::GemmShape<32, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1334,9 +1334,9 @@ TEST(SM50_device_maximum_minimum_ssrgemm_tt_n, 64x128x8_32x32x1_8x4_4x8_2x4) { using WarpShape = 
cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1370,9 +1370,9 @@ TEST(SM50_device_maximum_minimum_ssrgemm_tt_n, 64x256x8_32x64x1_8x8_4x8_2x4) { using WarpShape = cutlass::gemm::GemmShape<32, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1406,9 +1406,9 @@ TEST(SM50_device_maximum_minimum_ssrgemm_tt_n, 128x128x8_64x32x1_8x8_8x4_2x4) { using WarpShape = cutlass::gemm::GemmShape<64, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1442,9 +1442,9 @@ TEST(SM50_device_maximum_minimum_ssrgemm_tt_n, 32x32x8_8x16x1_2x2_4x8_4x2) { using WarpShape = cutlass::gemm::GemmShape<8, 16, 8>; using InstructionShape 
= cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1478,9 +1478,9 @@ TEST(SM50_device_maximum_minimum_ssrgemm_tt_n, 64x32x8_16x16x1_4x2_4x8_4x2) { using WarpShape = cutlass::gemm::GemmShape<16, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1514,9 +1514,9 @@ TEST(SM50_device_maximum_minimum_ssrgemm_tt_n, 64x64x8_16x32x1_4x4_4x8_4x2) { using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1550,9 +1550,9 @@ TEST(SM50_device_maximum_minimum_ssrgemm_tt_n, 128x32x8_32x16x1_4x4_8x4_4x2) { using WarpShape = cutlass::gemm::GemmShape<32, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = 
typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1586,9 +1586,9 @@ TEST(SM50_device_maximum_minimum_ssrgemm_tt_n, 128x64x8_32x32x1_8x4_4x8_4x2) { using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1622,9 +1622,9 @@ TEST(SM50_device_maximum_minimum_ssrgemm_tt_n, 128x128x8_32x64x1_8x8_4x8_4x2) { using WarpShape = cutlass::gemm::GemmShape<32, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1658,9 +1658,9 @@ TEST(SM50_device_maximum_minimum_ssrgemm_tt_n, 256x32x8_64x16x1_8x4_8x4_4x2) { using WarpShape = cutlass::gemm::GemmShape<64, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename 
cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1694,9 +1694,9 @@ TEST(SM50_device_maximum_minimum_ssrgemm_tt_n, 256x64x8_64x32x1_8x8_8x4_4x2) { using WarpShape = cutlass::gemm::GemmShape<64, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1730,9 +1730,9 @@ TEST(SM50_device_maximum_minimum_ssrgemm_tt_n, 32x64x16_8x16x1_2x2_4x8_4x4) { using WarpShape = cutlass::gemm::GemmShape<8, 16, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1766,9 +1766,9 @@ TEST(SM50_device_maximum_minimum_ssrgemm_tt_n, 32x128x16_8x32x1_2x4_4x8_4x4) { using WarpShape = cutlass::gemm::GemmShape<8, 32, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - 
precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1802,9 +1802,9 @@ TEST(SM50_device_maximum_minimum_ssrgemm_tt_n, 64x32x16_16x8x1_2x2_8x4_4x4) { using WarpShape = cutlass::gemm::GemmShape<16, 8, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1838,9 +1838,9 @@ TEST(SM50_device_maximum_minimum_ssrgemm_tt_n, 64x64x8_16x16x1_4x2_4x8_4x4) { using WarpShape = cutlass::gemm::GemmShape<16, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1874,9 +1874,9 @@ TEST(SM50_device_maximum_minimum_ssrgemm_tt_n, 64x128x8_16x32x1_4x4_4x8_4x4) { using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - 
cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1910,9 +1910,9 @@ TEST(SM50_device_maximum_minimum_ssrgemm_tt_n, 64x256x8_16x64x1_4x8_4x8_4x4) { using WarpShape = cutlass::gemm::GemmShape<16, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1946,9 +1946,9 @@ TEST(SM50_device_maximum_minimum_ssrgemm_tt_n, 128x32x16_32x8x1_4x2_8x4_4x4) { using WarpShape = cutlass::gemm::GemmShape<32, 8, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1982,9 +1982,9 @@ TEST(SM50_device_maximum_minimum_ssrgemm_tt_n, 128x64x8_32x16x1_4x4_8x4_4x4) { using WarpShape = cutlass::gemm::GemmShape<32, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = 
typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -2018,9 +2018,9 @@ TEST(SM50_device_maximum_minimum_ssrgemm_tt_n, 128x128x8_32x32x1_8x4_4x8_4x4) { using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -2054,9 +2054,9 @@ TEST(SM50_device_maximum_minimum_ssrgemm_tt_n, 256x64x8_64x16x1_8x4_8x4_4x4) { using WarpShape = cutlass::gemm::GemmShape<64, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; diff --git a/test/device/sm50_simt_maximum_minimum_ssrgemm_tt_t.cu b/test/device/sm50_simt_maximum_minimum_ssrgemm_tt_t.cu index 22b2041..8d53dcf 100644 --- a/test/device/sm50_simt_maximum_minimum_ssrgemm_tt_t.cu +++ b/test/device/sm50_simt_maximum_minimum_ssrgemm_tt_t.cu @@ -38,9 +38,9 @@ TEST(SM50_device_maximum_minimum_ssrgemm_tt_t, 8x32x8_8x32x1_2x4_4x8_1x1) { using WarpShape = cutlass::gemm::GemmShape<8, 32, 8>; using InstructionShape = 
cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -74,9 +74,9 @@ TEST(SM50_device_maximum_minimum_ssrgemm_tt_t, 16x32x8_16x32x1_4x4_4x8_1x1) { using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -110,9 +110,9 @@ TEST(SM50_device_maximum_minimum_ssrgemm_tt_t, 16x64x8_16x64x1_4x8_4x8_1x1) { using WarpShape = cutlass::gemm::GemmShape<16, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -146,9 +146,9 @@ TEST(SM50_device_maximum_minimum_ssrgemm_tt_t, 32x32x8_32x32x1_8x4_4x8_1x1) { using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename 
cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -182,9 +182,9 @@ TEST(SM50_device_maximum_minimum_ssrgemm_tt_t, 32x64x8_32x64x1_8x8_4x8_1x1) { using WarpShape = cutlass::gemm::GemmShape<32, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -218,9 +218,9 @@ TEST(SM50_device_maximum_minimum_ssrgemm_tt_t, 64x32x8_64x32x1_8x8_8x4_1x1) { using WarpShape = cutlass::gemm::GemmShape<64, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -254,9 +254,9 @@ TEST(SM50_device_maximum_minimum_ssrgemm_tt_t, 8x32x8_8x16x1_2x2_4x8_1x2) { using WarpShape = cutlass::gemm::GemmShape<8, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, 
precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -290,9 +290,9 @@ TEST(SM50_device_maximum_minimum_ssrgemm_tt_t, 8x64x8_8x32x1_2x4_4x8_1x2) { using WarpShape = cutlass::gemm::GemmShape<8, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -326,9 +326,9 @@ TEST(SM50_device_maximum_minimum_ssrgemm_tt_t, 16x32x8_16x16x1_4x2_4x8_1x2) { using WarpShape = cutlass::gemm::GemmShape<16, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -362,9 +362,9 @@ TEST(SM50_device_maximum_minimum_ssrgemm_tt_t, 16x64x8_16x32x1_4x4_4x8_1x2) { using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, 
cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -398,9 +398,9 @@ TEST(SM50_device_maximum_minimum_ssrgemm_tt_t, 16x128x8_16x64x1_4x8_4x8_1x2) { using WarpShape = cutlass::gemm::GemmShape<16, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -434,9 +434,9 @@ TEST(SM50_device_maximum_minimum_ssrgemm_tt_t, 32x32x8_32x16x1_4x4_8x4_1x2) { using WarpShape = cutlass::gemm::GemmShape<32, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -470,9 +470,9 @@ TEST(SM50_device_maximum_minimum_ssrgemm_tt_t, 32x64x8_32x32x1_8x4_4x8_1x2) { using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename 
cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -506,9 +506,9 @@ TEST(SM50_device_maximum_minimum_ssrgemm_tt_t, 32x128x8_32x64x1_8x8_4x8_1x2) { using WarpShape = cutlass::gemm::GemmShape<32, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -542,9 +542,9 @@ TEST(SM50_device_maximum_minimum_ssrgemm_tt_t, 64x64x8_64x32x1_8x8_8x4_1x2) { using WarpShape = cutlass::gemm::GemmShape<64, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -578,9 +578,9 @@ TEST(SM50_device_maximum_minimum_ssrgemm_tt_t, 32x32x8_16x32x1_4x4_4x8_2x1) { using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, 
precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -614,9 +614,9 @@ TEST(SM50_device_maximum_minimum_ssrgemm_tt_t, 64x32x8_32x32x1_8x4_4x8_2x1) { using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -650,9 +650,9 @@ TEST(SM50_device_maximum_minimum_ssrgemm_tt_t, 64x64x8_32x64x1_8x8_4x8_2x1) { using WarpShape = cutlass::gemm::GemmShape<32, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -686,9 +686,9 @@ TEST(SM50_device_maximum_minimum_ssrgemm_tt_t, 128x32x8_64x32x1_8x8_8x4_2x1) { using WarpShape = cutlass::gemm::GemmShape<64, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, 
OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -722,9 +722,9 @@ TEST(SM50_device_maximum_minimum_ssrgemm_tt_t, 16x32x8_8x16x1_2x2_4x8_2x2) { using WarpShape = cutlass::gemm::GemmShape<8, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -758,9 +758,9 @@ TEST(SM50_device_maximum_minimum_ssrgemm_tt_t, 16x64x8_8x32x1_2x4_4x8_2x2) { using WarpShape = cutlass::gemm::GemmShape<8, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -794,9 +794,9 @@ TEST(SM50_device_maximum_minimum_ssrgemm_tt_t, 32x32x8_16x16x1_4x2_4x8_2x2) { using WarpShape = cutlass::gemm::GemmShape<16, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = 
Config::MultiplicationOp; @@ -830,9 +830,9 @@ TEST(SM50_device_maximum_minimum_ssrgemm_tt_t, 32x64x8_16x32x1_4x4_4x8_2x2) { using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -866,9 +866,9 @@ TEST(SM50_device_maximum_minimum_ssrgemm_tt_t, 32x128x8_16x64x1_4x8_4x8_2x2) { using WarpShape = cutlass::gemm::GemmShape<16, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -902,9 +902,9 @@ TEST(SM50_device_maximum_minimum_ssrgemm_tt_t, 64x32x8_32x16x1_4x4_8x4_2x2) { using WarpShape = cutlass::gemm::GemmShape<32, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -938,9 +938,9 @@ 
TEST(SM50_device_maximum_minimum_ssrgemm_tt_t, 64x64x8_32x32x1_8x4_4x8_2x2) { using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -974,9 +974,9 @@ TEST(SM50_device_maximum_minimum_ssrgemm_tt_t, 64x128x8_32x64x1_8x8_4x8_2x2) { using WarpShape = cutlass::gemm::GemmShape<32, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1010,9 +1010,9 @@ TEST(SM50_device_maximum_minimum_ssrgemm_tt_t, 128x32x8_64x16x1_8x4_8x4_2x2) { using WarpShape = cutlass::gemm::GemmShape<64, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1046,9 +1046,9 @@ TEST(SM50_device_maximum_minimum_ssrgemm_tt_t, 
128x64x8_64x32x1_8x8_8x4_2x2) { using WarpShape = cutlass::gemm::GemmShape<64, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1082,9 +1082,9 @@ TEST(SM50_device_maximum_minimum_ssrgemm_tt_t, 16x64x16_8x16x1_2x2_4x8_2x4) { using WarpShape = cutlass::gemm::GemmShape<8, 16, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1118,9 +1118,9 @@ TEST(SM50_device_maximum_minimum_ssrgemm_tt_t, 16x128x16_8x32x1_2x4_4x8_2x4) { using WarpShape = cutlass::gemm::GemmShape<8, 32, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1154,9 +1154,9 @@ TEST(SM50_device_maximum_minimum_ssrgemm_tt_t, 32x32x8_16x8x1_2x2_8x4_2x4) { using WarpShape = 
cutlass::gemm::GemmShape<16, 8, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1190,9 +1190,9 @@ TEST(SM50_device_maximum_minimum_ssrgemm_tt_t, 32x64x8_16x16x1_4x2_4x8_2x4) { using WarpShape = cutlass::gemm::GemmShape<16, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1226,9 +1226,9 @@ TEST(SM50_device_maximum_minimum_ssrgemm_tt_t, 32x128x8_16x32x1_4x4_4x8_2x4) { using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1262,9 +1262,9 @@ TEST(SM50_device_maximum_minimum_ssrgemm_tt_t, 32x256x8_16x64x1_4x8_4x8_2x4) { using WarpShape = cutlass::gemm::GemmShape<16, 64, 8>; using InstructionShape 
= cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1298,9 +1298,9 @@ TEST(SM50_device_maximum_minimum_ssrgemm_tt_t, 64x64x8_32x16x1_4x4_8x4_2x4) { using WarpShape = cutlass::gemm::GemmShape<32, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1334,9 +1334,9 @@ TEST(SM50_device_maximum_minimum_ssrgemm_tt_t, 64x128x8_32x32x1_8x4_4x8_2x4) { using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1370,9 +1370,9 @@ TEST(SM50_device_maximum_minimum_ssrgemm_tt_t, 64x256x8_32x64x1_8x8_4x8_2x4) { using WarpShape = cutlass::gemm::GemmShape<32, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = 
typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1406,9 +1406,9 @@ TEST(SM50_device_maximum_minimum_ssrgemm_tt_t, 128x128x8_64x32x1_8x8_8x4_2x4) { using WarpShape = cutlass::gemm::GemmShape<64, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1442,9 +1442,9 @@ TEST(SM50_device_maximum_minimum_ssrgemm_tt_t, 32x32x8_8x16x1_2x2_4x8_4x2) { using WarpShape = cutlass::gemm::GemmShape<8, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1478,9 +1478,9 @@ TEST(SM50_device_maximum_minimum_ssrgemm_tt_t, 64x32x8_16x16x1_4x2_4x8_4x2) { using WarpShape = cutlass::gemm::GemmShape<16, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< 
// - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1514,9 +1514,9 @@ TEST(SM50_device_maximum_minimum_ssrgemm_tt_t, 64x64x8_16x32x1_4x4_4x8_4x2) { using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1550,9 +1550,9 @@ TEST(SM50_device_maximum_minimum_ssrgemm_tt_t, 128x32x8_32x16x1_4x4_8x4_4x2) { using WarpShape = cutlass::gemm::GemmShape<32, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1586,9 +1586,9 @@ TEST(SM50_device_maximum_minimum_ssrgemm_tt_t, 128x64x8_32x32x1_8x4_4x8_4x2) { using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, 
// - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1622,9 +1622,9 @@ TEST(SM50_device_maximum_minimum_ssrgemm_tt_t, 128x128x8_32x64x1_8x8_4x8_4x2) { using WarpShape = cutlass::gemm::GemmShape<32, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1658,9 +1658,9 @@ TEST(SM50_device_maximum_minimum_ssrgemm_tt_t, 256x32x8_64x16x1_8x4_8x4_4x2) { using WarpShape = cutlass::gemm::GemmShape<64, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1694,9 +1694,9 @@ TEST(SM50_device_maximum_minimum_ssrgemm_tt_t, 256x64x8_64x32x1_8x8_8x4_4x2) { using WarpShape = cutlass::gemm::GemmShape<64, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using 
Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1730,9 +1730,9 @@ TEST(SM50_device_maximum_minimum_ssrgemm_tt_t, 32x64x16_8x16x1_2x2_4x8_4x4) { using WarpShape = cutlass::gemm::GemmShape<8, 16, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1766,9 +1766,9 @@ TEST(SM50_device_maximum_minimum_ssrgemm_tt_t, 32x128x16_8x32x1_2x4_4x8_4x4) { using WarpShape = cutlass::gemm::GemmShape<8, 32, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1802,9 +1802,9 @@ TEST(SM50_device_maximum_minimum_ssrgemm_tt_t, 64x32x16_16x8x1_2x2_8x4_4x4) { using WarpShape = cutlass::gemm::GemmShape<16, 8, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename 
cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1838,9 +1838,9 @@ TEST(SM50_device_maximum_minimum_ssrgemm_tt_t, 64x64x8_16x16x1_4x2_4x8_4x4) { using WarpShape = cutlass::gemm::GemmShape<16, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1874,9 +1874,9 @@ TEST(SM50_device_maximum_minimum_ssrgemm_tt_t, 64x128x8_16x32x1_4x4_4x8_4x4) { using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1910,9 +1910,9 @@ TEST(SM50_device_maximum_minimum_ssrgemm_tt_t, 64x256x8_16x64x1_4x8_4x8_4x4) { using WarpShape = cutlass::gemm::GemmShape<16, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + 
precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1946,9 +1946,9 @@ TEST(SM50_device_maximum_minimum_ssrgemm_tt_t, 128x32x16_32x8x1_4x2_8x4_4x4) { using WarpShape = cutlass::gemm::GemmShape<32, 8, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1982,9 +1982,9 @@ TEST(SM50_device_maximum_minimum_ssrgemm_tt_t, 128x64x8_32x16x1_4x4_8x4_4x4) { using WarpShape = cutlass::gemm::GemmShape<32, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -2018,9 +2018,9 @@ TEST(SM50_device_maximum_minimum_ssrgemm_tt_t, 128x128x8_32x32x1_8x4_4x8_4x4) { using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + 
cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -2054,9 +2054,9 @@ TEST(SM50_device_maximum_minimum_ssrgemm_tt_t, 256x64x8_64x16x1_8x4_8x4_4x4) { using WarpShape = cutlass::gemm::GemmShape<64, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::minimum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::minimum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; diff --git a/test/device/sm50_simt_maximum_multiplies_dsrgemm_nn_n.cu b/test/device/sm50_simt_maximum_multiplies_dsrgemm_nn_n.cu index 9412254..93ef89f 100644 --- a/test/device/sm50_simt_maximum_multiplies_dsrgemm_nn_n.cu +++ b/test/device/sm50_simt_maximum_multiplies_dsrgemm_nn_n.cu @@ -38,9 +38,9 @@ TEST(SM50_device_maximum_multiplies_dsrgemm_nn_n, 8x32x8_8x32x1_2x4_4x8_1x1) { using WarpShape = cutlass::gemm::GemmShape<8, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -74,9 +74,9 @@ TEST(SM50_device_maximum_multiplies_dsrgemm_nn_n, 16x32x8_16x32x1_4x4_4x8_1x1) { using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // 
- precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -110,9 +110,9 @@ TEST(SM50_device_maximum_multiplies_dsrgemm_nn_n, 16x64x8_16x64x1_4x8_4x8_1x1) { using WarpShape = cutlass::gemm::GemmShape<16, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -146,9 +146,9 @@ TEST(SM50_device_maximum_multiplies_dsrgemm_nn_n, 32x32x8_32x32x1_8x4_4x8_1x1) { using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -182,9 +182,9 @@ TEST(SM50_device_maximum_multiplies_dsrgemm_nn_n, 8x32x8_8x16x1_2x2_4x8_1x2) { using WarpShape = cutlass::gemm::GemmShape<8, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, 
precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -218,9 +218,9 @@ TEST(SM50_device_maximum_multiplies_dsrgemm_nn_n, 8x64x8_8x32x1_2x4_4x8_1x2) { using WarpShape = cutlass::gemm::GemmShape<8, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -254,9 +254,9 @@ TEST(SM50_device_maximum_multiplies_dsrgemm_nn_n, 16x32x8_16x16x1_4x2_4x8_1x2) { using WarpShape = cutlass::gemm::GemmShape<16, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -290,9 +290,9 @@ TEST(SM50_device_maximum_multiplies_dsrgemm_nn_n, 16x64x8_16x32x1_4x4_4x8_1x2) { using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, 
cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -326,9 +326,9 @@ TEST(SM50_device_maximum_multiplies_dsrgemm_nn_n, 16x128x8_16x64x1_4x8_4x8_1x2) using WarpShape = cutlass::gemm::GemmShape<16, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -362,9 +362,9 @@ TEST(SM50_device_maximum_multiplies_dsrgemm_nn_n, 32x32x8_32x16x1_4x4_8x4_1x2) { using WarpShape = cutlass::gemm::GemmShape<32, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -398,9 +398,9 @@ TEST(SM50_device_maximum_multiplies_dsrgemm_nn_n, 32x64x8_32x32x1_8x4_4x8_1x2) { using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using 
Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -434,9 +434,9 @@ TEST(SM50_device_maximum_multiplies_dsrgemm_nn_n, 32x32x8_16x32x1_4x4_4x8_2x1) { using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -470,9 +470,9 @@ TEST(SM50_device_maximum_multiplies_dsrgemm_nn_n, 64x32x8_32x32x1_8x4_4x8_2x1) { using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -506,9 +506,9 @@ TEST(SM50_device_maximum_multiplies_dsrgemm_nn_n, 16x32x8_8x16x1_2x2_4x8_2x2) { using WarpShape = cutlass::gemm::GemmShape<8, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename 
cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -542,9 +542,9 @@ TEST(SM50_device_maximum_multiplies_dsrgemm_nn_n, 16x64x8_8x32x1_2x4_4x8_2x2) { using WarpShape = cutlass::gemm::GemmShape<8, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -578,9 +578,9 @@ TEST(SM50_device_maximum_multiplies_dsrgemm_nn_n, 32x32x8_16x16x1_4x2_4x8_2x2) { using WarpShape = cutlass::gemm::GemmShape<16, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -614,9 +614,9 @@ TEST(SM50_device_maximum_multiplies_dsrgemm_nn_n, 32x64x8_16x32x1_4x4_4x8_2x2) { using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename 
cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -650,9 +650,9 @@ TEST(SM50_device_maximum_multiplies_dsrgemm_nn_n, 32x128x8_16x64x1_4x8_4x8_2x2) using WarpShape = cutlass::gemm::GemmShape<16, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -686,9 +686,9 @@ TEST(SM50_device_maximum_multiplies_dsrgemm_nn_n, 64x32x8_32x16x1_4x4_8x4_2x2) { using WarpShape = cutlass::gemm::GemmShape<32, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -722,9 +722,9 @@ TEST(SM50_device_maximum_multiplies_dsrgemm_nn_n, 64x64x8_32x32x1_8x4_4x8_2x2) { using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename 
cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -758,9 +758,9 @@ TEST(SM50_device_maximum_multiplies_dsrgemm_nn_n, 128x32x8_64x16x1_8x4_8x4_2x2) using WarpShape = cutlass::gemm::GemmShape<64, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -794,9 +794,9 @@ TEST(SM50_device_maximum_multiplies_dsrgemm_nn_n, 16x64x16_8x16x1_2x2_4x8_2x4) { using WarpShape = cutlass::gemm::GemmShape<8, 16, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -830,9 +830,9 @@ TEST(SM50_device_maximum_multiplies_dsrgemm_nn_n, 16x128x16_8x32x1_2x4_4x8_2x4) using WarpShape = cutlass::gemm::GemmShape<8, 32, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename 
cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -866,9 +866,9 @@ TEST(SM50_device_maximum_multiplies_dsrgemm_nn_n, 32x32x8_16x8x1_2x2_8x4_2x4) { using WarpShape = cutlass::gemm::GemmShape<16, 8, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -902,9 +902,9 @@ TEST(SM50_device_maximum_multiplies_dsrgemm_nn_n, 32x64x8_16x16x1_4x2_4x8_2x4) { using WarpShape = cutlass::gemm::GemmShape<16, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -938,9 +938,9 @@ TEST(SM50_device_maximum_multiplies_dsrgemm_nn_n, 32x128x8_16x32x1_4x4_4x8_2x4) using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename 
cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -974,9 +974,9 @@ TEST(SM50_device_maximum_multiplies_dsrgemm_nn_n, 64x64x8_32x16x1_4x4_8x4_2x4) { using WarpShape = cutlass::gemm::GemmShape<32, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1010,9 +1010,9 @@ TEST(SM50_device_maximum_multiplies_dsrgemm_nn_n, 32x32x8_8x16x1_2x2_4x8_4x2) { using WarpShape = cutlass::gemm::GemmShape<8, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1046,9 +1046,9 @@ TEST(SM50_device_maximum_multiplies_dsrgemm_nn_n, 64x32x8_16x16x1_4x2_4x8_4x2) { using WarpShape = cutlass::gemm::GemmShape<16, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename 
cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1082,9 +1082,9 @@ TEST(SM50_device_maximum_multiplies_dsrgemm_nn_n, 64x64x8_16x32x1_4x4_4x8_4x2) { using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1118,9 +1118,9 @@ TEST(SM50_device_maximum_multiplies_dsrgemm_nn_n, 128x32x8_32x16x1_4x4_8x4_4x2) using WarpShape = cutlass::gemm::GemmShape<32, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1154,9 +1154,9 @@ TEST(SM50_device_maximum_multiplies_dsrgemm_nn_n, 32x64x16_8x16x1_2x2_4x8_4x4) { using WarpShape = cutlass::gemm::GemmShape<8, 16, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename 
cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1190,9 +1190,9 @@ TEST(SM50_device_maximum_multiplies_dsrgemm_nn_n, 32x128x16_8x32x1_2x4_4x8_4x4) using WarpShape = cutlass::gemm::GemmShape<8, 32, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1226,9 +1226,9 @@ TEST(SM50_device_maximum_multiplies_dsrgemm_nn_n, 64x32x16_16x8x1_2x2_8x4_4x4) { using WarpShape = cutlass::gemm::GemmShape<16, 8, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1262,9 +1262,9 @@ TEST(SM50_device_maximum_multiplies_dsrgemm_nn_n, 64x64x8_16x16x1_4x2_4x8_4x4) { using WarpShape = cutlass::gemm::GemmShape<16, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename 
cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1298,9 +1298,9 @@ TEST(SM50_device_maximum_multiplies_dsrgemm_nn_n, 128x32x16_32x8x1_4x2_8x4_4x4) using WarpShape = cutlass::gemm::GemmShape<32, 8, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; diff --git a/test/device/sm50_simt_maximum_multiplies_dsrgemm_nn_t.cu b/test/device/sm50_simt_maximum_multiplies_dsrgemm_nn_t.cu index 2cbfc31..3fe4dbd 100644 --- a/test/device/sm50_simt_maximum_multiplies_dsrgemm_nn_t.cu +++ b/test/device/sm50_simt_maximum_multiplies_dsrgemm_nn_t.cu @@ -38,9 +38,9 @@ TEST(SM50_device_maximum_multiplies_dsrgemm_nn_t, 8x32x8_8x32x1_2x4_4x8_1x1) { using WarpShape = cutlass::gemm::GemmShape<8, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -74,9 +74,9 @@ TEST(SM50_device_maximum_multiplies_dsrgemm_nn_t, 16x32x8_16x32x1_4x4_4x8_1x1) { using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = 
cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -110,9 +110,9 @@ TEST(SM50_device_maximum_multiplies_dsrgemm_nn_t, 16x64x8_16x64x1_4x8_4x8_1x1) { using WarpShape = cutlass::gemm::GemmShape<16, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -146,9 +146,9 @@ TEST(SM50_device_maximum_multiplies_dsrgemm_nn_t, 32x32x8_32x32x1_8x4_4x8_1x1) { using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -182,9 +182,9 @@ TEST(SM50_device_maximum_multiplies_dsrgemm_nn_t, 8x32x8_8x16x1_2x2_4x8_1x2) { using WarpShape = cutlass::gemm::GemmShape<8, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using 
Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -218,9 +218,9 @@ TEST(SM50_device_maximum_multiplies_dsrgemm_nn_t, 8x64x8_8x32x1_2x4_4x8_1x2) { using WarpShape = cutlass::gemm::GemmShape<8, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -254,9 +254,9 @@ TEST(SM50_device_maximum_multiplies_dsrgemm_nn_t, 16x32x8_16x16x1_4x2_4x8_1x2) { using WarpShape = cutlass::gemm::GemmShape<16, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -290,9 +290,9 @@ TEST(SM50_device_maximum_multiplies_dsrgemm_nn_t, 16x64x8_16x32x1_4x4_4x8_1x2) { using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename 
cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -326,9 +326,9 @@ TEST(SM50_device_maximum_multiplies_dsrgemm_nn_t, 16x128x8_16x64x1_4x8_4x8_1x2) using WarpShape = cutlass::gemm::GemmShape<16, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -362,9 +362,9 @@ TEST(SM50_device_maximum_multiplies_dsrgemm_nn_t, 32x32x8_32x16x1_4x4_8x4_1x2) { using WarpShape = cutlass::gemm::GemmShape<32, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -398,9 +398,9 @@ TEST(SM50_device_maximum_multiplies_dsrgemm_nn_t, 32x64x8_32x32x1_8x4_4x8_1x2) { using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename 
cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -434,9 +434,9 @@ TEST(SM50_device_maximum_multiplies_dsrgemm_nn_t, 32x32x8_16x32x1_4x4_4x8_2x1) { using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -470,9 +470,9 @@ TEST(SM50_device_maximum_multiplies_dsrgemm_nn_t, 64x32x8_32x32x1_8x4_4x8_2x1) { using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -506,9 +506,9 @@ TEST(SM50_device_maximum_multiplies_dsrgemm_nn_t, 16x32x8_8x16x1_2x2_4x8_2x2) { using WarpShape = cutlass::gemm::GemmShape<8, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename 
cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -542,9 +542,9 @@ TEST(SM50_device_maximum_multiplies_dsrgemm_nn_t, 16x64x8_8x32x1_2x4_4x8_2x2) { using WarpShape = cutlass::gemm::GemmShape<8, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -578,9 +578,9 @@ TEST(SM50_device_maximum_multiplies_dsrgemm_nn_t, 32x32x8_16x16x1_4x2_4x8_2x2) { using WarpShape = cutlass::gemm::GemmShape<16, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -614,9 +614,9 @@ TEST(SM50_device_maximum_multiplies_dsrgemm_nn_t, 32x64x8_16x32x1_4x4_4x8_2x2) { using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename 
cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -650,9 +650,9 @@ TEST(SM50_device_maximum_multiplies_dsrgemm_nn_t, 32x128x8_16x64x1_4x8_4x8_2x2) using WarpShape = cutlass::gemm::GemmShape<16, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -686,9 +686,9 @@ TEST(SM50_device_maximum_multiplies_dsrgemm_nn_t, 64x32x8_32x16x1_4x4_8x4_2x2) { using WarpShape = cutlass::gemm::GemmShape<32, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -722,9 +722,9 @@ TEST(SM50_device_maximum_multiplies_dsrgemm_nn_t, 64x64x8_32x32x1_8x4_4x8_2x2) { using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename 
cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -758,9 +758,9 @@ TEST(SM50_device_maximum_multiplies_dsrgemm_nn_t, 128x32x8_64x16x1_8x4_8x4_2x2) using WarpShape = cutlass::gemm::GemmShape<64, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -794,9 +794,9 @@ TEST(SM50_device_maximum_multiplies_dsrgemm_nn_t, 16x64x16_8x16x1_2x2_4x8_2x4) { using WarpShape = cutlass::gemm::GemmShape<8, 16, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -830,9 +830,9 @@ TEST(SM50_device_maximum_multiplies_dsrgemm_nn_t, 16x128x16_8x32x1_2x4_4x8_2x4) using WarpShape = cutlass::gemm::GemmShape<8, 32, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename 
cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -866,9 +866,9 @@ TEST(SM50_device_maximum_multiplies_dsrgemm_nn_t, 32x32x8_16x8x1_2x2_8x4_2x4) { using WarpShape = cutlass::gemm::GemmShape<16, 8, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -902,9 +902,9 @@ TEST(SM50_device_maximum_multiplies_dsrgemm_nn_t, 32x64x8_16x16x1_4x2_4x8_2x4) { using WarpShape = cutlass::gemm::GemmShape<16, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -938,9 +938,9 @@ TEST(SM50_device_maximum_multiplies_dsrgemm_nn_t, 32x128x8_16x32x1_4x4_4x8_2x4) using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename 
cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -974,9 +974,9 @@ TEST(SM50_device_maximum_multiplies_dsrgemm_nn_t, 64x64x8_32x16x1_4x4_8x4_2x4) { using WarpShape = cutlass::gemm::GemmShape<32, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1010,9 +1010,9 @@ TEST(SM50_device_maximum_multiplies_dsrgemm_nn_t, 32x32x8_8x16x1_2x2_4x8_4x2) { using WarpShape = cutlass::gemm::GemmShape<8, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1046,9 +1046,9 @@ TEST(SM50_device_maximum_multiplies_dsrgemm_nn_t, 64x32x8_16x16x1_4x2_4x8_4x2) { using WarpShape = cutlass::gemm::GemmShape<16, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename 
cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1082,9 +1082,9 @@ TEST(SM50_device_maximum_multiplies_dsrgemm_nn_t, 64x64x8_16x32x1_4x4_4x8_4x2) { using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1118,9 +1118,9 @@ TEST(SM50_device_maximum_multiplies_dsrgemm_nn_t, 128x32x8_32x16x1_4x4_8x4_4x2) using WarpShape = cutlass::gemm::GemmShape<32, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1154,9 +1154,9 @@ TEST(SM50_device_maximum_multiplies_dsrgemm_nn_t, 32x64x16_8x16x1_2x2_4x8_4x4) { using WarpShape = cutlass::gemm::GemmShape<8, 16, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename 
cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1190,9 +1190,9 @@ TEST(SM50_device_maximum_multiplies_dsrgemm_nn_t, 32x128x16_8x32x1_2x4_4x8_4x4) using WarpShape = cutlass::gemm::GemmShape<8, 32, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1226,9 +1226,9 @@ TEST(SM50_device_maximum_multiplies_dsrgemm_nn_t, 64x32x16_16x8x1_2x2_8x4_4x4) { using WarpShape = cutlass::gemm::GemmShape<16, 8, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1262,9 +1262,9 @@ TEST(SM50_device_maximum_multiplies_dsrgemm_nn_t, 64x64x8_16x16x1_4x2_4x8_4x4) { using WarpShape = cutlass::gemm::GemmShape<16, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename 
cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1298,9 +1298,9 @@ TEST(SM50_device_maximum_multiplies_dsrgemm_nn_t, 128x32x16_32x8x1_4x2_8x4_4x4) using WarpShape = cutlass::gemm::GemmShape<32, 8, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; diff --git a/test/device/sm50_simt_maximum_multiplies_dsrgemm_nt_n.cu b/test/device/sm50_simt_maximum_multiplies_dsrgemm_nt_n.cu index f431ccc..c39296a 100644 --- a/test/device/sm50_simt_maximum_multiplies_dsrgemm_nt_n.cu +++ b/test/device/sm50_simt_maximum_multiplies_dsrgemm_nt_n.cu @@ -38,9 +38,9 @@ TEST(SM50_device_maximum_multiplies_dsrgemm_nt_n, 8x32x8_8x32x1_2x4_4x8_1x1) { using WarpShape = cutlass::gemm::GemmShape<8, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; 
@@ -74,9 +74,9 @@ TEST(SM50_device_maximum_multiplies_dsrgemm_nt_n, 16x32x8_16x32x1_4x4_4x8_1x1) { using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -110,9 +110,9 @@ TEST(SM50_device_maximum_multiplies_dsrgemm_nt_n, 16x64x8_16x64x1_4x8_4x8_1x1) { using WarpShape = cutlass::gemm::GemmShape<16, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -146,9 +146,9 @@ TEST(SM50_device_maximum_multiplies_dsrgemm_nt_n, 32x32x8_32x32x1_8x4_4x8_1x1) { using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -182,9 +182,9 @@ 
TEST(SM50_device_maximum_multiplies_dsrgemm_nt_n, 8x32x8_8x16x1_2x2_4x8_1x2) { using WarpShape = cutlass::gemm::GemmShape<8, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -218,9 +218,9 @@ TEST(SM50_device_maximum_multiplies_dsrgemm_nt_n, 8x64x8_8x32x1_2x4_4x8_1x2) { using WarpShape = cutlass::gemm::GemmShape<8, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -254,9 +254,9 @@ TEST(SM50_device_maximum_multiplies_dsrgemm_nt_n, 16x32x8_16x16x1_4x2_4x8_1x2) { using WarpShape = cutlass::gemm::GemmShape<16, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -290,9 +290,9 @@ 
TEST(SM50_device_maximum_multiplies_dsrgemm_nt_n, 16x64x8_16x32x1_4x4_4x8_1x2) { using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -326,9 +326,9 @@ TEST(SM50_device_maximum_multiplies_dsrgemm_nt_n, 16x128x8_16x64x1_4x8_4x8_1x2) using WarpShape = cutlass::gemm::GemmShape<16, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -362,9 +362,9 @@ TEST(SM50_device_maximum_multiplies_dsrgemm_nt_n, 32x32x8_32x16x1_4x4_8x4_1x2) { using WarpShape = cutlass::gemm::GemmShape<32, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -398,9 +398,9 @@ 
TEST(SM50_device_maximum_multiplies_dsrgemm_nt_n, 32x64x8_32x32x1_8x4_4x8_1x2) { using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -434,9 +434,9 @@ TEST(SM50_device_maximum_multiplies_dsrgemm_nt_n, 32x32x8_16x32x1_4x4_4x8_2x1) { using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -470,9 +470,9 @@ TEST(SM50_device_maximum_multiplies_dsrgemm_nt_n, 64x32x8_32x32x1_8x4_4x8_2x1) { using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -506,9 +506,9 @@ 
TEST(SM50_device_maximum_multiplies_dsrgemm_nt_n, 16x32x8_8x16x1_2x2_4x8_2x2) { using WarpShape = cutlass::gemm::GemmShape<8, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -542,9 +542,9 @@ TEST(SM50_device_maximum_multiplies_dsrgemm_nt_n, 16x64x8_8x32x1_2x4_4x8_2x2) { using WarpShape = cutlass::gemm::GemmShape<8, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -578,9 +578,9 @@ TEST(SM50_device_maximum_multiplies_dsrgemm_nt_n, 32x32x8_16x16x1_4x2_4x8_2x2) { using WarpShape = cutlass::gemm::GemmShape<16, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -614,9 +614,9 @@ 
TEST(SM50_device_maximum_multiplies_dsrgemm_nt_n, 32x64x8_16x32x1_4x4_4x8_2x2) { using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -650,9 +650,9 @@ TEST(SM50_device_maximum_multiplies_dsrgemm_nt_n, 32x128x8_16x64x1_4x8_4x8_2x2) using WarpShape = cutlass::gemm::GemmShape<16, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -686,9 +686,9 @@ TEST(SM50_device_maximum_multiplies_dsrgemm_nt_n, 64x32x8_32x16x1_4x4_8x4_2x2) { using WarpShape = cutlass::gemm::GemmShape<32, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -722,9 +722,9 @@ 
TEST(SM50_device_maximum_multiplies_dsrgemm_nt_n, 64x64x8_32x32x1_8x4_4x8_2x2) { using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -758,9 +758,9 @@ TEST(SM50_device_maximum_multiplies_dsrgemm_nt_n, 128x32x8_64x16x1_8x4_8x4_2x2) using WarpShape = cutlass::gemm::GemmShape<64, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -794,9 +794,9 @@ TEST(SM50_device_maximum_multiplies_dsrgemm_nt_n, 16x64x16_8x16x1_2x2_4x8_2x4) { using WarpShape = cutlass::gemm::GemmShape<8, 16, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -830,9 +830,9 @@ 
TEST(SM50_device_maximum_multiplies_dsrgemm_nt_n, 16x128x16_8x32x1_2x4_4x8_2x4) using WarpShape = cutlass::gemm::GemmShape<8, 32, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -866,9 +866,9 @@ TEST(SM50_device_maximum_multiplies_dsrgemm_nt_n, 32x32x8_16x8x1_2x2_8x4_2x4) { using WarpShape = cutlass::gemm::GemmShape<16, 8, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -902,9 +902,9 @@ TEST(SM50_device_maximum_multiplies_dsrgemm_nt_n, 32x64x8_16x16x1_4x2_4x8_2x4) { using WarpShape = cutlass::gemm::GemmShape<16, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -938,9 +938,9 @@ 
TEST(SM50_device_maximum_multiplies_dsrgemm_nt_n, 32x128x8_16x32x1_4x4_4x8_2x4) using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -974,9 +974,9 @@ TEST(SM50_device_maximum_multiplies_dsrgemm_nt_n, 64x64x8_32x16x1_4x4_8x4_2x4) { using WarpShape = cutlass::gemm::GemmShape<32, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1010,9 +1010,9 @@ TEST(SM50_device_maximum_multiplies_dsrgemm_nt_n, 32x32x8_8x16x1_2x2_4x8_4x2) { using WarpShape = cutlass::gemm::GemmShape<8, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1046,9 +1046,9 @@ 
TEST(SM50_device_maximum_multiplies_dsrgemm_nt_n, 64x32x8_16x16x1_4x2_4x8_4x2) { using WarpShape = cutlass::gemm::GemmShape<16, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1082,9 +1082,9 @@ TEST(SM50_device_maximum_multiplies_dsrgemm_nt_n, 64x64x8_16x32x1_4x4_4x8_4x2) { using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1118,9 +1118,9 @@ TEST(SM50_device_maximum_multiplies_dsrgemm_nt_n, 128x32x8_32x16x1_4x4_8x4_4x2) using WarpShape = cutlass::gemm::GemmShape<32, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1154,9 +1154,9 @@ 
TEST(SM50_device_maximum_multiplies_dsrgemm_nt_n, 32x64x16_8x16x1_2x2_4x8_4x4) { using WarpShape = cutlass::gemm::GemmShape<8, 16, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1190,9 +1190,9 @@ TEST(SM50_device_maximum_multiplies_dsrgemm_nt_n, 32x128x16_8x32x1_2x4_4x8_4x4) using WarpShape = cutlass::gemm::GemmShape<8, 32, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1226,9 +1226,9 @@ TEST(SM50_device_maximum_multiplies_dsrgemm_nt_n, 64x32x16_16x8x1_2x2_8x4_4x4) { using WarpShape = cutlass::gemm::GemmShape<16, 8, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1262,9 +1262,9 @@ 
TEST(SM50_device_maximum_multiplies_dsrgemm_nt_n, 64x64x8_16x16x1_4x2_4x8_4x4) { using WarpShape = cutlass::gemm::GemmShape<16, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1298,9 +1298,9 @@ TEST(SM50_device_maximum_multiplies_dsrgemm_nt_n, 128x32x16_32x8x1_4x2_8x4_4x4) using WarpShape = cutlass::gemm::GemmShape<32, 8, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; diff --git a/test/device/sm50_simt_maximum_multiplies_dsrgemm_nt_t.cu b/test/device/sm50_simt_maximum_multiplies_dsrgemm_nt_t.cu index 84c4fc5..a3a4c37 100644 --- a/test/device/sm50_simt_maximum_multiplies_dsrgemm_nt_t.cu +++ b/test/device/sm50_simt_maximum_multiplies_dsrgemm_nt_t.cu @@ -38,9 +38,9 @@ TEST(SM50_device_maximum_multiplies_dsrgemm_nt_t, 8x32x8_8x32x1_2x4_4x8_1x1) { using WarpShape = cutlass::gemm::GemmShape<8, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename 
cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -74,9 +74,9 @@ TEST(SM50_device_maximum_multiplies_dsrgemm_nt_t, 16x32x8_16x32x1_4x4_4x8_1x1) { using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -110,9 +110,9 @@ TEST(SM50_device_maximum_multiplies_dsrgemm_nt_t, 16x64x8_16x64x1_4x8_4x8_1x1) { using WarpShape = cutlass::gemm::GemmShape<16, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -146,9 +146,9 @@ TEST(SM50_device_maximum_multiplies_dsrgemm_nt_t, 32x32x8_32x32x1_8x4_4x8_1x1) { using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename 
cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -182,9 +182,9 @@ TEST(SM50_device_maximum_multiplies_dsrgemm_nt_t, 8x32x8_8x16x1_2x2_4x8_1x2) { using WarpShape = cutlass::gemm::GemmShape<8, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -218,9 +218,9 @@ TEST(SM50_device_maximum_multiplies_dsrgemm_nt_t, 8x64x8_8x32x1_2x4_4x8_1x2) { using WarpShape = cutlass::gemm::GemmShape<8, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -254,9 +254,9 @@ TEST(SM50_device_maximum_multiplies_dsrgemm_nt_t, 16x32x8_16x16x1_4x2_4x8_1x2) { using WarpShape = cutlass::gemm::GemmShape<16, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename 
cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -290,9 +290,9 @@ TEST(SM50_device_maximum_multiplies_dsrgemm_nt_t, 16x64x8_16x32x1_4x4_4x8_1x2) { using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -326,9 +326,9 @@ TEST(SM50_device_maximum_multiplies_dsrgemm_nt_t, 16x128x8_16x64x1_4x8_4x8_1x2) using WarpShape = cutlass::gemm::GemmShape<16, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -362,9 +362,9 @@ TEST(SM50_device_maximum_multiplies_dsrgemm_nt_t, 32x32x8_32x16x1_4x4_8x4_1x2) { using WarpShape = cutlass::gemm::GemmShape<32, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename 
cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -398,9 +398,9 @@ TEST(SM50_device_maximum_multiplies_dsrgemm_nt_t, 32x64x8_32x32x1_8x4_4x8_1x2) { using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -434,9 +434,9 @@ TEST(SM50_device_maximum_multiplies_dsrgemm_nt_t, 32x32x8_16x32x1_4x4_4x8_2x1) { using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -470,9 +470,9 @@ TEST(SM50_device_maximum_multiplies_dsrgemm_nt_t, 64x32x8_32x32x1_8x4_4x8_2x1) { using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename 
cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -506,9 +506,9 @@ TEST(SM50_device_maximum_multiplies_dsrgemm_nt_t, 16x32x8_8x16x1_2x2_4x8_2x2) { using WarpShape = cutlass::gemm::GemmShape<8, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -542,9 +542,9 @@ TEST(SM50_device_maximum_multiplies_dsrgemm_nt_t, 16x64x8_8x32x1_2x4_4x8_2x2) { using WarpShape = cutlass::gemm::GemmShape<8, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -578,9 +578,9 @@ TEST(SM50_device_maximum_multiplies_dsrgemm_nt_t, 32x32x8_16x16x1_4x2_4x8_2x2) { using WarpShape = cutlass::gemm::GemmShape<16, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename 
cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -614,9 +614,9 @@ TEST(SM50_device_maximum_multiplies_dsrgemm_nt_t, 32x64x8_16x32x1_4x4_4x8_2x2) { using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -650,9 +650,9 @@ TEST(SM50_device_maximum_multiplies_dsrgemm_nt_t, 32x128x8_16x64x1_4x8_4x8_2x2) using WarpShape = cutlass::gemm::GemmShape<16, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -686,9 +686,9 @@ TEST(SM50_device_maximum_multiplies_dsrgemm_nt_t, 64x32x8_32x16x1_4x4_8x4_2x2) { using WarpShape = cutlass::gemm::GemmShape<32, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename 
cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -722,9 +722,9 @@ TEST(SM50_device_maximum_multiplies_dsrgemm_nt_t, 64x64x8_32x32x1_8x4_4x8_2x2) { using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -758,9 +758,9 @@ TEST(SM50_device_maximum_multiplies_dsrgemm_nt_t, 128x32x8_64x16x1_8x4_8x4_2x2) using WarpShape = cutlass::gemm::GemmShape<64, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -794,9 +794,9 @@ TEST(SM50_device_maximum_multiplies_dsrgemm_nt_t, 16x64x16_8x16x1_2x2_4x8_2x4) { using WarpShape = cutlass::gemm::GemmShape<8, 16, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename 
cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -830,9 +830,9 @@ TEST(SM50_device_maximum_multiplies_dsrgemm_nt_t, 16x128x16_8x32x1_2x4_4x8_2x4) using WarpShape = cutlass::gemm::GemmShape<8, 32, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -866,9 +866,9 @@ TEST(SM50_device_maximum_multiplies_dsrgemm_nt_t, 32x32x8_16x8x1_2x2_8x4_2x4) { using WarpShape = cutlass::gemm::GemmShape<16, 8, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -902,9 +902,9 @@ TEST(SM50_device_maximum_multiplies_dsrgemm_nt_t, 32x64x8_16x16x1_4x2_4x8_2x4) { using WarpShape = cutlass::gemm::GemmShape<16, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename 
cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -938,9 +938,9 @@ TEST(SM50_device_maximum_multiplies_dsrgemm_nt_t, 32x128x8_16x32x1_4x4_4x8_2x4) using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -974,9 +974,9 @@ TEST(SM50_device_maximum_multiplies_dsrgemm_nt_t, 64x64x8_32x16x1_4x4_8x4_2x4) { using WarpShape = cutlass::gemm::GemmShape<32, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1010,9 +1010,9 @@ TEST(SM50_device_maximum_multiplies_dsrgemm_nt_t, 32x32x8_8x16x1_2x2_4x8_4x2) { using WarpShape = cutlass::gemm::GemmShape<8, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename 
cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1046,9 +1046,9 @@ TEST(SM50_device_maximum_multiplies_dsrgemm_nt_t, 64x32x8_16x16x1_4x2_4x8_4x2) { using WarpShape = cutlass::gemm::GemmShape<16, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1082,9 +1082,9 @@ TEST(SM50_device_maximum_multiplies_dsrgemm_nt_t, 64x64x8_16x32x1_4x4_4x8_4x2) { using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1118,9 +1118,9 @@ TEST(SM50_device_maximum_multiplies_dsrgemm_nt_t, 128x32x8_32x16x1_4x4_8x4_4x2) using WarpShape = cutlass::gemm::GemmShape<32, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename 
cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1154,9 +1154,9 @@ TEST(SM50_device_maximum_multiplies_dsrgemm_nt_t, 32x64x16_8x16x1_2x2_4x8_4x4) { using WarpShape = cutlass::gemm::GemmShape<8, 16, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1190,9 +1190,9 @@ TEST(SM50_device_maximum_multiplies_dsrgemm_nt_t, 32x128x16_8x32x1_2x4_4x8_4x4) using WarpShape = cutlass::gemm::GemmShape<8, 32, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1226,9 +1226,9 @@ TEST(SM50_device_maximum_multiplies_dsrgemm_nt_t, 64x32x16_16x8x1_2x2_8x4_4x4) { using WarpShape = cutlass::gemm::GemmShape<16, 8, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename 
cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1262,9 +1262,9 @@ TEST(SM50_device_maximum_multiplies_dsrgemm_nt_t, 64x64x8_16x16x1_4x2_4x8_4x4) { using WarpShape = cutlass::gemm::GemmShape<16, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1298,9 +1298,9 @@ TEST(SM50_device_maximum_multiplies_dsrgemm_nt_t, 128x32x16_32x8x1_4x2_8x4_4x4) using WarpShape = cutlass::gemm::GemmShape<32, 8, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; diff --git a/test/device/sm50_simt_maximum_multiplies_dsrgemm_tn_n.cu b/test/device/sm50_simt_maximum_multiplies_dsrgemm_tn_n.cu index 962f529..204dc47 100644 --- a/test/device/sm50_simt_maximum_multiplies_dsrgemm_tn_n.cu +++ b/test/device/sm50_simt_maximum_multiplies_dsrgemm_tn_n.cu @@ -38,9 +38,9 @@ TEST(SM50_device_maximum_multiplies_dsrgemm_tn_n, 8x32x8_8x32x1_2x4_4x8_1x1) { using WarpShape = cutlass::gemm::GemmShape<8, 32, 8>; using InstructionShape = 
cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -74,9 +74,9 @@ TEST(SM50_device_maximum_multiplies_dsrgemm_tn_n, 16x32x8_16x32x1_4x4_4x8_1x1) { using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -110,9 +110,9 @@ TEST(SM50_device_maximum_multiplies_dsrgemm_tn_n, 16x64x8_16x64x1_4x8_4x8_1x1) { using WarpShape = cutlass::gemm::GemmShape<16, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -146,9 +146,9 @@ TEST(SM50_device_maximum_multiplies_dsrgemm_tn_n, 32x32x8_32x32x1_8x4_4x8_1x1) { using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using 
Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -182,9 +182,9 @@ TEST(SM50_device_maximum_multiplies_dsrgemm_tn_n, 8x32x8_8x16x1_2x2_4x8_1x2) { using WarpShape = cutlass::gemm::GemmShape<8, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -218,9 +218,9 @@ TEST(SM50_device_maximum_multiplies_dsrgemm_tn_n, 8x64x8_8x32x1_2x4_4x8_1x2) { using WarpShape = cutlass::gemm::GemmShape<8, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -254,9 +254,9 @@ TEST(SM50_device_maximum_multiplies_dsrgemm_tn_n, 16x32x8_16x16x1_4x2_4x8_1x2) { using WarpShape = cutlass::gemm::GemmShape<16, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename 
cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -290,9 +290,9 @@ TEST(SM50_device_maximum_multiplies_dsrgemm_tn_n, 16x64x8_16x32x1_4x4_4x8_1x2) { using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -326,9 +326,9 @@ TEST(SM50_device_maximum_multiplies_dsrgemm_tn_n, 16x128x8_16x64x1_4x8_4x8_1x2) using WarpShape = cutlass::gemm::GemmShape<16, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -362,9 +362,9 @@ TEST(SM50_device_maximum_multiplies_dsrgemm_tn_n, 32x32x8_32x16x1_4x4_8x4_1x2) { using WarpShape = cutlass::gemm::GemmShape<32, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename 
cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -398,9 +398,9 @@ TEST(SM50_device_maximum_multiplies_dsrgemm_tn_n, 32x64x8_32x32x1_8x4_4x8_1x2) { using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -434,9 +434,9 @@ TEST(SM50_device_maximum_multiplies_dsrgemm_tn_n, 32x32x8_16x32x1_4x4_4x8_2x1) { using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -470,9 +470,9 @@ TEST(SM50_device_maximum_multiplies_dsrgemm_tn_n, 64x32x8_32x32x1_8x4_4x8_2x1) { using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename 
cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -506,9 +506,9 @@ TEST(SM50_device_maximum_multiplies_dsrgemm_tn_n, 16x32x8_8x16x1_2x2_4x8_2x2) { using WarpShape = cutlass::gemm::GemmShape<8, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -542,9 +542,9 @@ TEST(SM50_device_maximum_multiplies_dsrgemm_tn_n, 16x64x8_8x32x1_2x4_4x8_2x2) { using WarpShape = cutlass::gemm::GemmShape<8, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -578,9 +578,9 @@ TEST(SM50_device_maximum_multiplies_dsrgemm_tn_n, 32x32x8_16x16x1_4x2_4x8_2x2) { using WarpShape = cutlass::gemm::GemmShape<16, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename 
cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -614,9 +614,9 @@ TEST(SM50_device_maximum_multiplies_dsrgemm_tn_n, 32x64x8_16x32x1_4x4_4x8_2x2) { using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -650,9 +650,9 @@ TEST(SM50_device_maximum_multiplies_dsrgemm_tn_n, 32x128x8_16x64x1_4x8_4x8_2x2) using WarpShape = cutlass::gemm::GemmShape<16, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -686,9 +686,9 @@ TEST(SM50_device_maximum_multiplies_dsrgemm_tn_n, 64x32x8_32x16x1_4x4_8x4_2x2) { using WarpShape = cutlass::gemm::GemmShape<32, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename 
cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -722,9 +722,9 @@ TEST(SM50_device_maximum_multiplies_dsrgemm_tn_n, 64x64x8_32x32x1_8x4_4x8_2x2) { using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -758,9 +758,9 @@ TEST(SM50_device_maximum_multiplies_dsrgemm_tn_n, 128x32x8_64x16x1_8x4_8x4_2x2) using WarpShape = cutlass::gemm::GemmShape<64, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -794,9 +794,9 @@ TEST(SM50_device_maximum_multiplies_dsrgemm_tn_n, 16x64x16_8x16x1_2x2_4x8_2x4) { using WarpShape = cutlass::gemm::GemmShape<8, 16, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename 
cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -830,9 +830,9 @@ TEST(SM50_device_maximum_multiplies_dsrgemm_tn_n, 16x128x16_8x32x1_2x4_4x8_2x4) using WarpShape = cutlass::gemm::GemmShape<8, 32, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -866,9 +866,9 @@ TEST(SM50_device_maximum_multiplies_dsrgemm_tn_n, 32x32x8_16x8x1_2x2_8x4_2x4) { using WarpShape = cutlass::gemm::GemmShape<16, 8, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -902,9 +902,9 @@ TEST(SM50_device_maximum_multiplies_dsrgemm_tn_n, 32x64x8_16x16x1_4x2_4x8_2x4) { using WarpShape = cutlass::gemm::GemmShape<16, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename 
cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -938,9 +938,9 @@ TEST(SM50_device_maximum_multiplies_dsrgemm_tn_n, 32x128x8_16x32x1_4x4_4x8_2x4) using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -974,9 +974,9 @@ TEST(SM50_device_maximum_multiplies_dsrgemm_tn_n, 64x64x8_32x16x1_4x4_8x4_2x4) { using WarpShape = cutlass::gemm::GemmShape<32, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1010,9 +1010,9 @@ TEST(SM50_device_maximum_multiplies_dsrgemm_tn_n, 32x32x8_8x16x1_2x2_4x8_4x2) { using WarpShape = cutlass::gemm::GemmShape<8, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename 
cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1046,9 +1046,9 @@ TEST(SM50_device_maximum_multiplies_dsrgemm_tn_n, 64x32x8_16x16x1_4x2_4x8_4x2) { using WarpShape = cutlass::gemm::GemmShape<16, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1082,9 +1082,9 @@ TEST(SM50_device_maximum_multiplies_dsrgemm_tn_n, 64x64x8_16x32x1_4x4_4x8_4x2) { using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1118,9 +1118,9 @@ TEST(SM50_device_maximum_multiplies_dsrgemm_tn_n, 128x32x8_32x16x1_4x4_8x4_4x2) using WarpShape = cutlass::gemm::GemmShape<32, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename 
cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1154,9 +1154,9 @@ TEST(SM50_device_maximum_multiplies_dsrgemm_tn_n, 32x64x16_8x16x1_2x2_4x8_4x4) { using WarpShape = cutlass::gemm::GemmShape<8, 16, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1190,9 +1190,9 @@ TEST(SM50_device_maximum_multiplies_dsrgemm_tn_n, 32x128x16_8x32x1_2x4_4x8_4x4) using WarpShape = cutlass::gemm::GemmShape<8, 32, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1226,9 +1226,9 @@ TEST(SM50_device_maximum_multiplies_dsrgemm_tn_n, 64x32x16_16x8x1_2x2_8x4_4x4) { using WarpShape = cutlass::gemm::GemmShape<16, 8, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename 
cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1262,9 +1262,9 @@ TEST(SM50_device_maximum_multiplies_dsrgemm_tn_n, 64x64x8_16x16x1_4x2_4x8_4x4) { using WarpShape = cutlass::gemm::GemmShape<16, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1298,9 +1298,9 @@ TEST(SM50_device_maximum_multiplies_dsrgemm_tn_n, 128x32x16_32x8x1_4x2_8x4_4x4) using WarpShape = cutlass::gemm::GemmShape<32, 8, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; diff --git a/test/device/sm50_simt_maximum_multiplies_dsrgemm_tn_t.cu b/test/device/sm50_simt_maximum_multiplies_dsrgemm_tn_t.cu index f7184e0..9a447f4 100644 --- a/test/device/sm50_simt_maximum_multiplies_dsrgemm_tn_t.cu +++ 
b/test/device/sm50_simt_maximum_multiplies_dsrgemm_tn_t.cu @@ -38,9 +38,9 @@ TEST(SM50_device_maximum_multiplies_dsrgemm_tn_t, 8x32x8_8x32x1_2x4_4x8_1x1) { using WarpShape = cutlass::gemm::GemmShape<8, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -74,9 +74,9 @@ TEST(SM50_device_maximum_multiplies_dsrgemm_tn_t, 16x32x8_16x32x1_4x4_4x8_1x1) { using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -110,9 +110,9 @@ TEST(SM50_device_maximum_multiplies_dsrgemm_tn_t, 16x64x8_16x64x1_4x8_4x8_1x1) { using WarpShape = cutlass::gemm::GemmShape<16, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = 
Config::MultiplicationOp; @@ -146,9 +146,9 @@ TEST(SM50_device_maximum_multiplies_dsrgemm_tn_t, 32x32x8_32x32x1_8x4_4x8_1x1) { using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -182,9 +182,9 @@ TEST(SM50_device_maximum_multiplies_dsrgemm_tn_t, 8x32x8_8x16x1_2x2_4x8_1x2) { using WarpShape = cutlass::gemm::GemmShape<8, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -218,9 +218,9 @@ TEST(SM50_device_maximum_multiplies_dsrgemm_tn_t, 8x64x8_8x32x1_2x4_4x8_1x2) { using WarpShape = cutlass::gemm::GemmShape<8, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -254,9 +254,9 @@ 
TEST(SM50_device_maximum_multiplies_dsrgemm_tn_t, 16x32x8_16x16x1_4x2_4x8_1x2) { using WarpShape = cutlass::gemm::GemmShape<16, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -290,9 +290,9 @@ TEST(SM50_device_maximum_multiplies_dsrgemm_tn_t, 16x64x8_16x32x1_4x4_4x8_1x2) { using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -326,9 +326,9 @@ TEST(SM50_device_maximum_multiplies_dsrgemm_tn_t, 16x128x8_16x64x1_4x8_4x8_1x2) using WarpShape = cutlass::gemm::GemmShape<16, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -362,9 +362,9 @@ 
TEST(SM50_device_maximum_multiplies_dsrgemm_tn_t, 32x32x8_32x16x1_4x4_8x4_1x2) { using WarpShape = cutlass::gemm::GemmShape<32, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -398,9 +398,9 @@ TEST(SM50_device_maximum_multiplies_dsrgemm_tn_t, 32x64x8_32x32x1_8x4_4x8_1x2) { using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -434,9 +434,9 @@ TEST(SM50_device_maximum_multiplies_dsrgemm_tn_t, 32x32x8_16x32x1_4x4_4x8_2x1) { using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -470,9 +470,9 @@ 
TEST(SM50_device_maximum_multiplies_dsrgemm_tn_t, 64x32x8_32x32x1_8x4_4x8_2x1) { using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -506,9 +506,9 @@ TEST(SM50_device_maximum_multiplies_dsrgemm_tn_t, 16x32x8_8x16x1_2x2_4x8_2x2) { using WarpShape = cutlass::gemm::GemmShape<8, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -542,9 +542,9 @@ TEST(SM50_device_maximum_multiplies_dsrgemm_tn_t, 16x64x8_8x32x1_2x4_4x8_2x2) { using WarpShape = cutlass::gemm::GemmShape<8, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -578,9 +578,9 @@ 
TEST(SM50_device_maximum_multiplies_dsrgemm_tn_t, 32x32x8_16x16x1_4x2_4x8_2x2) { using WarpShape = cutlass::gemm::GemmShape<16, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -614,9 +614,9 @@ TEST(SM50_device_maximum_multiplies_dsrgemm_tn_t, 32x64x8_16x32x1_4x4_4x8_2x2) { using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -650,9 +650,9 @@ TEST(SM50_device_maximum_multiplies_dsrgemm_tn_t, 32x128x8_16x64x1_4x8_4x8_2x2) using WarpShape = cutlass::gemm::GemmShape<16, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -686,9 +686,9 @@ 
TEST(SM50_device_maximum_multiplies_dsrgemm_tn_t, 64x32x8_32x16x1_4x4_8x4_2x2) { using WarpShape = cutlass::gemm::GemmShape<32, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -722,9 +722,9 @@ TEST(SM50_device_maximum_multiplies_dsrgemm_tn_t, 64x64x8_32x32x1_8x4_4x8_2x2) { using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -758,9 +758,9 @@ TEST(SM50_device_maximum_multiplies_dsrgemm_tn_t, 128x32x8_64x16x1_8x4_8x4_2x2) using WarpShape = cutlass::gemm::GemmShape<64, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -794,9 +794,9 @@ 
TEST(SM50_device_maximum_multiplies_dsrgemm_tn_t, 16x64x16_8x16x1_2x2_4x8_2x4) { using WarpShape = cutlass::gemm::GemmShape<8, 16, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -830,9 +830,9 @@ TEST(SM50_device_maximum_multiplies_dsrgemm_tn_t, 16x128x16_8x32x1_2x4_4x8_2x4) using WarpShape = cutlass::gemm::GemmShape<8, 32, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -866,9 +866,9 @@ TEST(SM50_device_maximum_multiplies_dsrgemm_tn_t, 32x32x8_16x8x1_2x2_8x4_2x4) { using WarpShape = cutlass::gemm::GemmShape<16, 8, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -902,9 +902,9 @@ 
TEST(SM50_device_maximum_multiplies_dsrgemm_tn_t, 32x64x8_16x16x1_4x2_4x8_2x4) { using WarpShape = cutlass::gemm::GemmShape<16, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -938,9 +938,9 @@ TEST(SM50_device_maximum_multiplies_dsrgemm_tn_t, 32x128x8_16x32x1_4x4_4x8_2x4) using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -974,9 +974,9 @@ TEST(SM50_device_maximum_multiplies_dsrgemm_tn_t, 64x64x8_32x16x1_4x4_8x4_2x4) { using WarpShape = cutlass::gemm::GemmShape<32, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1010,9 +1010,9 @@ 
TEST(SM50_device_maximum_multiplies_dsrgemm_tn_t, 32x32x8_8x16x1_2x2_4x8_4x2) { using WarpShape = cutlass::gemm::GemmShape<8, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1046,9 +1046,9 @@ TEST(SM50_device_maximum_multiplies_dsrgemm_tn_t, 64x32x8_16x16x1_4x2_4x8_4x2) { using WarpShape = cutlass::gemm::GemmShape<16, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1082,9 +1082,9 @@ TEST(SM50_device_maximum_multiplies_dsrgemm_tn_t, 64x64x8_16x32x1_4x4_4x8_4x2) { using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1118,9 +1118,9 @@ 
TEST(SM50_device_maximum_multiplies_dsrgemm_tn_t, 128x32x8_32x16x1_4x4_8x4_4x2) using WarpShape = cutlass::gemm::GemmShape<32, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1154,9 +1154,9 @@ TEST(SM50_device_maximum_multiplies_dsrgemm_tn_t, 32x64x16_8x16x1_2x2_4x8_4x4) { using WarpShape = cutlass::gemm::GemmShape<8, 16, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1190,9 +1190,9 @@ TEST(SM50_device_maximum_multiplies_dsrgemm_tn_t, 32x128x16_8x32x1_2x4_4x8_4x4) using WarpShape = cutlass::gemm::GemmShape<8, 32, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1226,9 +1226,9 @@ 
TEST(SM50_device_maximum_multiplies_dsrgemm_tn_t, 64x32x16_16x8x1_2x2_8x4_4x4) { using WarpShape = cutlass::gemm::GemmShape<16, 8, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1262,9 +1262,9 @@ TEST(SM50_device_maximum_multiplies_dsrgemm_tn_t, 64x64x8_16x16x1_4x2_4x8_4x4) { using WarpShape = cutlass::gemm::GemmShape<16, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1298,9 +1298,9 @@ TEST(SM50_device_maximum_multiplies_dsrgemm_tn_t, 128x32x16_32x8x1_4x2_8x4_4x4) using WarpShape = cutlass::gemm::GemmShape<32, 8, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; diff --git 
a/test/device/sm50_simt_maximum_multiplies_dsrgemm_tt_n.cu b/test/device/sm50_simt_maximum_multiplies_dsrgemm_tt_n.cu index 58f7d5e..bf34b76 100644 --- a/test/device/sm50_simt_maximum_multiplies_dsrgemm_tt_n.cu +++ b/test/device/sm50_simt_maximum_multiplies_dsrgemm_tt_n.cu @@ -38,9 +38,9 @@ TEST(SM50_device_maximum_multiplies_dsrgemm_tt_n, 8x32x8_8x32x1_2x4_4x8_1x1) { using WarpShape = cutlass::gemm::GemmShape<8, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -74,9 +74,9 @@ TEST(SM50_device_maximum_multiplies_dsrgemm_tt_n, 16x32x8_16x32x1_4x4_4x8_1x1) { using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -110,9 +110,9 @@ TEST(SM50_device_maximum_multiplies_dsrgemm_tt_n, 16x64x8_16x64x1_4x8_4x8_1x1) { using WarpShape = cutlass::gemm::GemmShape<16, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename 
cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -146,9 +146,9 @@ TEST(SM50_device_maximum_multiplies_dsrgemm_tt_n, 32x32x8_32x32x1_8x4_4x8_1x1) { using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -182,9 +182,9 @@ TEST(SM50_device_maximum_multiplies_dsrgemm_tt_n, 8x32x8_8x16x1_2x2_4x8_1x2) { using WarpShape = cutlass::gemm::GemmShape<8, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -218,9 +218,9 @@ TEST(SM50_device_maximum_multiplies_dsrgemm_tt_n, 8x64x8_8x32x1_2x4_4x8_1x2) { using WarpShape = cutlass::gemm::GemmShape<8, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename 
cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -254,9 +254,9 @@ TEST(SM50_device_maximum_multiplies_dsrgemm_tt_n, 16x32x8_16x16x1_4x2_4x8_1x2) { using WarpShape = cutlass::gemm::GemmShape<16, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -290,9 +290,9 @@ TEST(SM50_device_maximum_multiplies_dsrgemm_tt_n, 16x64x8_16x32x1_4x4_4x8_1x2) { using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -326,9 +326,9 @@ TEST(SM50_device_maximum_multiplies_dsrgemm_tt_n, 16x128x8_16x64x1_4x8_4x8_1x2) using WarpShape = cutlass::gemm::GemmShape<16, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename 
cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -362,9 +362,9 @@ TEST(SM50_device_maximum_multiplies_dsrgemm_tt_n, 32x32x8_32x16x1_4x4_8x4_1x2) { using WarpShape = cutlass::gemm::GemmShape<32, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -398,9 +398,9 @@ TEST(SM50_device_maximum_multiplies_dsrgemm_tt_n, 32x64x8_32x32x1_8x4_4x8_1x2) { using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -434,9 +434,9 @@ TEST(SM50_device_maximum_multiplies_dsrgemm_tt_n, 32x32x8_16x32x1_4x4_4x8_2x1) { using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename 
cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -470,9 +470,9 @@ TEST(SM50_device_maximum_multiplies_dsrgemm_tt_n, 64x32x8_32x32x1_8x4_4x8_2x1) { using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -506,9 +506,9 @@ TEST(SM50_device_maximum_multiplies_dsrgemm_tt_n, 16x32x8_8x16x1_2x2_4x8_2x2) { using WarpShape = cutlass::gemm::GemmShape<8, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -542,9 +542,9 @@ TEST(SM50_device_maximum_multiplies_dsrgemm_tt_n, 16x64x8_8x32x1_2x4_4x8_2x2) { using WarpShape = cutlass::gemm::GemmShape<8, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename 
cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -578,9 +578,9 @@ TEST(SM50_device_maximum_multiplies_dsrgemm_tt_n, 32x32x8_16x16x1_4x2_4x8_2x2) { using WarpShape = cutlass::gemm::GemmShape<16, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -614,9 +614,9 @@ TEST(SM50_device_maximum_multiplies_dsrgemm_tt_n, 32x64x8_16x32x1_4x4_4x8_2x2) { using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -650,9 +650,9 @@ TEST(SM50_device_maximum_multiplies_dsrgemm_tt_n, 32x128x8_16x64x1_4x8_4x8_2x2) using WarpShape = cutlass::gemm::GemmShape<16, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename 
cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -686,9 +686,9 @@ TEST(SM50_device_maximum_multiplies_dsrgemm_tt_n, 64x32x8_32x16x1_4x4_8x4_2x2) { using WarpShape = cutlass::gemm::GemmShape<32, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -722,9 +722,9 @@ TEST(SM50_device_maximum_multiplies_dsrgemm_tt_n, 64x64x8_32x32x1_8x4_4x8_2x2) { using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -758,9 +758,9 @@ TEST(SM50_device_maximum_multiplies_dsrgemm_tt_n, 128x32x8_64x16x1_8x4_8x4_2x2) using WarpShape = cutlass::gemm::GemmShape<64, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename 
cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -794,9 +794,9 @@ TEST(SM50_device_maximum_multiplies_dsrgemm_tt_n, 16x64x16_8x16x1_2x2_4x8_2x4) { using WarpShape = cutlass::gemm::GemmShape<8, 16, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -830,9 +830,9 @@ TEST(SM50_device_maximum_multiplies_dsrgemm_tt_n, 16x128x16_8x32x1_2x4_4x8_2x4) using WarpShape = cutlass::gemm::GemmShape<8, 32, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -866,9 +866,9 @@ TEST(SM50_device_maximum_multiplies_dsrgemm_tt_n, 32x32x8_16x8x1_2x2_8x4_2x4) { using WarpShape = cutlass::gemm::GemmShape<16, 8, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename 
cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -902,9 +902,9 @@ TEST(SM50_device_maximum_multiplies_dsrgemm_tt_n, 32x64x8_16x16x1_4x2_4x8_2x4) { using WarpShape = cutlass::gemm::GemmShape<16, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -938,9 +938,9 @@ TEST(SM50_device_maximum_multiplies_dsrgemm_tt_n, 32x128x8_16x32x1_4x4_4x8_2x4) using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -974,9 +974,9 @@ TEST(SM50_device_maximum_multiplies_dsrgemm_tt_n, 64x64x8_32x16x1_4x4_8x4_2x4) { using WarpShape = cutlass::gemm::GemmShape<32, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename 
cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1010,9 +1010,9 @@ TEST(SM50_device_maximum_multiplies_dsrgemm_tt_n, 32x32x8_8x16x1_2x2_4x8_4x2) { using WarpShape = cutlass::gemm::GemmShape<8, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1046,9 +1046,9 @@ TEST(SM50_device_maximum_multiplies_dsrgemm_tt_n, 64x32x8_16x16x1_4x2_4x8_4x2) { using WarpShape = cutlass::gemm::GemmShape<16, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1082,9 +1082,9 @@ TEST(SM50_device_maximum_multiplies_dsrgemm_tt_n, 64x64x8_16x32x1_4x4_4x8_4x2) { using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename 
cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1118,9 +1118,9 @@ TEST(SM50_device_maximum_multiplies_dsrgemm_tt_n, 128x32x8_32x16x1_4x4_8x4_4x2) using WarpShape = cutlass::gemm::GemmShape<32, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1154,9 +1154,9 @@ TEST(SM50_device_maximum_multiplies_dsrgemm_tt_n, 32x64x16_8x16x1_2x2_4x8_4x4) { using WarpShape = cutlass::gemm::GemmShape<8, 16, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1190,9 +1190,9 @@ TEST(SM50_device_maximum_multiplies_dsrgemm_tt_n, 32x128x16_8x32x1_2x4_4x8_4x4) using WarpShape = cutlass::gemm::GemmShape<8, 32, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename 
cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1226,9 +1226,9 @@ TEST(SM50_device_maximum_multiplies_dsrgemm_tt_n, 64x32x16_16x8x1_2x2_8x4_4x4) { using WarpShape = cutlass::gemm::GemmShape<16, 8, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1262,9 +1262,9 @@ TEST(SM50_device_maximum_multiplies_dsrgemm_tt_n, 64x64x8_16x16x1_4x2_4x8_4x4) { using WarpShape = cutlass::gemm::GemmShape<16, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1298,9 +1298,9 @@ TEST(SM50_device_maximum_multiplies_dsrgemm_tt_n, 128x32x16_32x8x1_4x2_8x4_4x4) using WarpShape = cutlass::gemm::GemmShape<32, 8, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename 
cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; diff --git a/test/device/sm50_simt_maximum_multiplies_dsrgemm_tt_t.cu b/test/device/sm50_simt_maximum_multiplies_dsrgemm_tt_t.cu index 3a3af40..6971426 100644 --- a/test/device/sm50_simt_maximum_multiplies_dsrgemm_tt_t.cu +++ b/test/device/sm50_simt_maximum_multiplies_dsrgemm_tt_t.cu @@ -38,9 +38,9 @@ TEST(SM50_device_maximum_multiplies_dsrgemm_tt_t, 8x32x8_8x32x1_2x4_4x8_1x1) { using WarpShape = cutlass::gemm::GemmShape<8, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -74,9 +74,9 @@ TEST(SM50_device_maximum_multiplies_dsrgemm_tt_t, 16x32x8_16x32x1_4x4_4x8_1x1) { using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -110,9 +110,9 @@ TEST(SM50_device_maximum_multiplies_dsrgemm_tt_t, 16x64x8_16x64x1_4x8_4x8_1x1) { using WarpShape = cutlass::gemm::GemmShape<16, 64, 8>; using InstructionShape = 
cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -146,9 +146,9 @@ TEST(SM50_device_maximum_multiplies_dsrgemm_tt_t, 32x32x8_32x32x1_8x4_4x8_1x1) { using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -182,9 +182,9 @@ TEST(SM50_device_maximum_multiplies_dsrgemm_tt_t, 8x32x8_8x16x1_2x2_4x8_1x2) { using WarpShape = cutlass::gemm::GemmShape<8, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -218,9 +218,9 @@ TEST(SM50_device_maximum_multiplies_dsrgemm_tt_t, 8x64x8_8x32x1_2x4_4x8_1x2) { using WarpShape = cutlass::gemm::GemmShape<8, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using 
Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -254,9 +254,9 @@ TEST(SM50_device_maximum_multiplies_dsrgemm_tt_t, 16x32x8_16x16x1_4x2_4x8_1x2) { using WarpShape = cutlass::gemm::GemmShape<16, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -290,9 +290,9 @@ TEST(SM50_device_maximum_multiplies_dsrgemm_tt_t, 16x64x8_16x32x1_4x4_4x8_1x2) { using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -326,9 +326,9 @@ TEST(SM50_device_maximum_multiplies_dsrgemm_tt_t, 16x128x8_16x64x1_4x8_4x8_1x2) using WarpShape = cutlass::gemm::GemmShape<16, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename 
cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -362,9 +362,9 @@ TEST(SM50_device_maximum_multiplies_dsrgemm_tt_t, 32x32x8_32x16x1_4x4_8x4_1x2) { using WarpShape = cutlass::gemm::GemmShape<32, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -398,9 +398,9 @@ TEST(SM50_device_maximum_multiplies_dsrgemm_tt_t, 32x64x8_32x32x1_8x4_4x8_1x2) { using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -434,9 +434,9 @@ TEST(SM50_device_maximum_multiplies_dsrgemm_tt_t, 32x32x8_16x32x1_4x4_4x8_2x1) { using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename 
cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -470,9 +470,9 @@ TEST(SM50_device_maximum_multiplies_dsrgemm_tt_t, 64x32x8_32x32x1_8x4_4x8_2x1) { using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -506,9 +506,9 @@ TEST(SM50_device_maximum_multiplies_dsrgemm_tt_t, 16x32x8_8x16x1_2x2_4x8_2x2) { using WarpShape = cutlass::gemm::GemmShape<8, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -542,9 +542,9 @@ TEST(SM50_device_maximum_multiplies_dsrgemm_tt_t, 16x64x8_8x32x1_2x4_4x8_2x2) { using WarpShape = cutlass::gemm::GemmShape<8, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename 
cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -578,9 +578,9 @@ TEST(SM50_device_maximum_multiplies_dsrgemm_tt_t, 32x32x8_16x16x1_4x2_4x8_2x2) { using WarpShape = cutlass::gemm::GemmShape<16, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -614,9 +614,9 @@ TEST(SM50_device_maximum_multiplies_dsrgemm_tt_t, 32x64x8_16x32x1_4x4_4x8_2x2) { using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -650,9 +650,9 @@ TEST(SM50_device_maximum_multiplies_dsrgemm_tt_t, 32x128x8_16x64x1_4x8_4x8_2x2) using WarpShape = cutlass::gemm::GemmShape<16, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename 
cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -686,9 +686,9 @@ TEST(SM50_device_maximum_multiplies_dsrgemm_tt_t, 64x32x8_32x16x1_4x4_8x4_2x2) { using WarpShape = cutlass::gemm::GemmShape<32, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -722,9 +722,9 @@ TEST(SM50_device_maximum_multiplies_dsrgemm_tt_t, 64x64x8_32x32x1_8x4_4x8_2x2) { using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -758,9 +758,9 @@ TEST(SM50_device_maximum_multiplies_dsrgemm_tt_t, 128x32x8_64x16x1_8x4_8x4_2x2) using WarpShape = cutlass::gemm::GemmShape<64, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename 
cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -794,9 +794,9 @@ TEST(SM50_device_maximum_multiplies_dsrgemm_tt_t, 16x64x16_8x16x1_2x2_4x8_2x4) { using WarpShape = cutlass::gemm::GemmShape<8, 16, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -830,9 +830,9 @@ TEST(SM50_device_maximum_multiplies_dsrgemm_tt_t, 16x128x16_8x32x1_2x4_4x8_2x4) using WarpShape = cutlass::gemm::GemmShape<8, 32, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -866,9 +866,9 @@ TEST(SM50_device_maximum_multiplies_dsrgemm_tt_t, 32x32x8_16x8x1_2x2_8x4_2x4) { using WarpShape = cutlass::gemm::GemmShape<16, 8, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename 
cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -902,9 +902,9 @@ TEST(SM50_device_maximum_multiplies_dsrgemm_tt_t, 32x64x8_16x16x1_4x2_4x8_2x4) { using WarpShape = cutlass::gemm::GemmShape<16, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -938,9 +938,9 @@ TEST(SM50_device_maximum_multiplies_dsrgemm_tt_t, 32x128x8_16x32x1_4x4_4x8_2x4) using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -974,9 +974,9 @@ TEST(SM50_device_maximum_multiplies_dsrgemm_tt_t, 64x64x8_32x16x1_4x4_8x4_2x4) { using WarpShape = cutlass::gemm::GemmShape<32, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename 
cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1010,9 +1010,9 @@ TEST(SM50_device_maximum_multiplies_dsrgemm_tt_t, 32x32x8_8x16x1_2x2_4x8_4x2) { using WarpShape = cutlass::gemm::GemmShape<8, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1046,9 +1046,9 @@ TEST(SM50_device_maximum_multiplies_dsrgemm_tt_t, 64x32x8_16x16x1_4x2_4x8_4x2) { using WarpShape = cutlass::gemm::GemmShape<16, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1082,9 +1082,9 @@ TEST(SM50_device_maximum_multiplies_dsrgemm_tt_t, 64x64x8_16x32x1_4x4_4x8_4x2) { using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename 
cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1118,9 +1118,9 @@ TEST(SM50_device_maximum_multiplies_dsrgemm_tt_t, 128x32x8_32x16x1_4x4_8x4_4x2) using WarpShape = cutlass::gemm::GemmShape<32, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1154,9 +1154,9 @@ TEST(SM50_device_maximum_multiplies_dsrgemm_tt_t, 32x64x16_8x16x1_2x2_4x8_4x4) { using WarpShape = cutlass::gemm::GemmShape<8, 16, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1190,9 +1190,9 @@ TEST(SM50_device_maximum_multiplies_dsrgemm_tt_t, 32x128x16_8x32x1_2x4_4x8_4x4) using WarpShape = cutlass::gemm::GemmShape<8, 32, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename 
cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1226,9 +1226,9 @@ TEST(SM50_device_maximum_multiplies_dsrgemm_tt_t, 64x32x16_16x8x1_2x2_8x4_4x4) { using WarpShape = cutlass::gemm::GemmShape<16, 8, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1262,9 +1262,9 @@ TEST(SM50_device_maximum_multiplies_dsrgemm_tt_t, 64x64x8_16x16x1_4x2_4x8_4x4) { using WarpShape = cutlass::gemm::GemmShape<16, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1298,9 +1298,9 @@ TEST(SM50_device_maximum_multiplies_dsrgemm_tt_t, 128x32x16_32x8x1_4x2_8x4_4x4) using WarpShape = cutlass::gemm::GemmShape<32, 8, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename 
cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; diff --git a/test/device/sm50_simt_maximum_multiplies_ssrgemm_nn_n.cu b/test/device/sm50_simt_maximum_multiplies_ssrgemm_nn_n.cu index 28cf3e2..dba2055 100644 --- a/test/device/sm50_simt_maximum_multiplies_ssrgemm_nn_n.cu +++ b/test/device/sm50_simt_maximum_multiplies_ssrgemm_nn_n.cu @@ -38,9 +38,9 @@ TEST(SM50_device_maximum_multiplies_ssrgemm_nn_n, 8x32x8_8x32x1_2x4_4x8_1x1) { using WarpShape = cutlass::gemm::GemmShape<8, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -74,9 +74,9 @@ TEST(SM50_device_maximum_multiplies_ssrgemm_nn_n, 16x32x8_16x32x1_4x4_4x8_1x1) { using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ 
-110,9 +110,9 @@ TEST(SM50_device_maximum_multiplies_ssrgemm_nn_n, 16x64x8_16x64x1_4x8_4x8_1x1) { using WarpShape = cutlass::gemm::GemmShape<16, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -146,9 +146,9 @@ TEST(SM50_device_maximum_multiplies_ssrgemm_nn_n, 32x32x8_32x32x1_8x4_4x8_1x1) { using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -182,9 +182,9 @@ TEST(SM50_device_maximum_multiplies_ssrgemm_nn_n, 32x64x8_32x64x1_8x8_4x8_1x1) { using WarpShape = cutlass::gemm::GemmShape<32, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -218,9 +218,9 @@ 
TEST(SM50_device_maximum_multiplies_ssrgemm_nn_n, 64x32x8_64x32x1_8x8_8x4_1x1) { using WarpShape = cutlass::gemm::GemmShape<64, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -254,9 +254,9 @@ TEST(SM50_device_maximum_multiplies_ssrgemm_nn_n, 8x32x8_8x16x1_2x2_4x8_1x2) { using WarpShape = cutlass::gemm::GemmShape<8, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -290,9 +290,9 @@ TEST(SM50_device_maximum_multiplies_ssrgemm_nn_n, 8x64x8_8x32x1_2x4_4x8_1x2) { using WarpShape = cutlass::gemm::GemmShape<8, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -326,9 +326,9 @@ 
TEST(SM50_device_maximum_multiplies_ssrgemm_nn_n, 16x32x8_16x16x1_4x2_4x8_1x2) { using WarpShape = cutlass::gemm::GemmShape<16, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -362,9 +362,9 @@ TEST(SM50_device_maximum_multiplies_ssrgemm_nn_n, 16x64x8_16x32x1_4x4_4x8_1x2) { using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -398,9 +398,9 @@ TEST(SM50_device_maximum_multiplies_ssrgemm_nn_n, 16x128x8_16x64x1_4x8_4x8_1x2) using WarpShape = cutlass::gemm::GemmShape<16, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -434,9 +434,9 @@ 
TEST(SM50_device_maximum_multiplies_ssrgemm_nn_n, 32x32x8_32x16x1_4x4_8x4_1x2) { using WarpShape = cutlass::gemm::GemmShape<32, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -470,9 +470,9 @@ TEST(SM50_device_maximum_multiplies_ssrgemm_nn_n, 32x64x8_32x32x1_8x4_4x8_1x2) { using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -506,9 +506,9 @@ TEST(SM50_device_maximum_multiplies_ssrgemm_nn_n, 32x128x8_32x64x1_8x8_4x8_1x2) using WarpShape = cutlass::gemm::GemmShape<32, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -542,9 +542,9 @@ 
TEST(SM50_device_maximum_multiplies_ssrgemm_nn_n, 64x64x8_64x32x1_8x8_8x4_1x2) { using WarpShape = cutlass::gemm::GemmShape<64, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -578,9 +578,9 @@ TEST(SM50_device_maximum_multiplies_ssrgemm_nn_n, 32x32x8_16x32x1_4x4_4x8_2x1) { using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -614,9 +614,9 @@ TEST(SM50_device_maximum_multiplies_ssrgemm_nn_n, 64x32x8_32x32x1_8x4_4x8_2x1) { using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -650,9 +650,9 @@ 
TEST(SM50_device_maximum_multiplies_ssrgemm_nn_n, 64x64x8_32x64x1_8x8_4x8_2x1) { using WarpShape = cutlass::gemm::GemmShape<32, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -686,9 +686,9 @@ TEST(SM50_device_maximum_multiplies_ssrgemm_nn_n, 128x32x8_64x32x1_8x8_8x4_2x1) using WarpShape = cutlass::gemm::GemmShape<64, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -722,9 +722,9 @@ TEST(SM50_device_maximum_multiplies_ssrgemm_nn_n, 16x32x8_8x16x1_2x2_4x8_2x2) { using WarpShape = cutlass::gemm::GemmShape<8, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -758,9 +758,9 @@ 
TEST(SM50_device_maximum_multiplies_ssrgemm_nn_n, 16x64x8_8x32x1_2x4_4x8_2x2) { using WarpShape = cutlass::gemm::GemmShape<8, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -794,9 +794,9 @@ TEST(SM50_device_maximum_multiplies_ssrgemm_nn_n, 32x32x8_16x16x1_4x2_4x8_2x2) { using WarpShape = cutlass::gemm::GemmShape<16, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -830,9 +830,9 @@ TEST(SM50_device_maximum_multiplies_ssrgemm_nn_n, 32x64x8_16x32x1_4x4_4x8_2x2) { using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -866,9 +866,9 @@ 
TEST(SM50_device_maximum_multiplies_ssrgemm_nn_n, 32x128x8_16x64x1_4x8_4x8_2x2) using WarpShape = cutlass::gemm::GemmShape<16, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -902,9 +902,9 @@ TEST(SM50_device_maximum_multiplies_ssrgemm_nn_n, 64x32x8_32x16x1_4x4_8x4_2x2) { using WarpShape = cutlass::gemm::GemmShape<32, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -938,9 +938,9 @@ TEST(SM50_device_maximum_multiplies_ssrgemm_nn_n, 64x64x8_32x32x1_8x4_4x8_2x2) { using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -974,9 +974,9 @@ 
TEST(SM50_device_maximum_multiplies_ssrgemm_nn_n, 64x128x8_32x64x1_8x8_4x8_2x2) using WarpShape = cutlass::gemm::GemmShape<32, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1010,9 +1010,9 @@ TEST(SM50_device_maximum_multiplies_ssrgemm_nn_n, 128x32x8_64x16x1_8x4_8x4_2x2) using WarpShape = cutlass::gemm::GemmShape<64, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1046,9 +1046,9 @@ TEST(SM50_device_maximum_multiplies_ssrgemm_nn_n, 128x64x8_64x32x1_8x8_8x4_2x2) using WarpShape = cutlass::gemm::GemmShape<64, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1082,9 +1082,9 @@ 
TEST(SM50_device_maximum_multiplies_ssrgemm_nn_n, 16x64x16_8x16x1_2x2_4x8_2x4) { using WarpShape = cutlass::gemm::GemmShape<8, 16, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1118,9 +1118,9 @@ TEST(SM50_device_maximum_multiplies_ssrgemm_nn_n, 16x128x16_8x32x1_2x4_4x8_2x4) using WarpShape = cutlass::gemm::GemmShape<8, 32, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1154,9 +1154,9 @@ TEST(SM50_device_maximum_multiplies_ssrgemm_nn_n, 32x32x8_16x8x1_2x2_8x4_2x4) { using WarpShape = cutlass::gemm::GemmShape<16, 8, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1190,9 +1190,9 @@ 
TEST(SM50_device_maximum_multiplies_ssrgemm_nn_n, 32x64x8_16x16x1_4x2_4x8_2x4) { using WarpShape = cutlass::gemm::GemmShape<16, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1226,9 +1226,9 @@ TEST(SM50_device_maximum_multiplies_ssrgemm_nn_n, 32x128x8_16x32x1_4x4_4x8_2x4) using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1262,9 +1262,9 @@ TEST(SM50_device_maximum_multiplies_ssrgemm_nn_n, 32x256x8_16x64x1_4x8_4x8_2x4) using WarpShape = cutlass::gemm::GemmShape<16, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1298,9 +1298,9 @@ 
TEST(SM50_device_maximum_multiplies_ssrgemm_nn_n, 64x64x8_32x16x1_4x4_8x4_2x4) { using WarpShape = cutlass::gemm::GemmShape<32, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1334,9 +1334,9 @@ TEST(SM50_device_maximum_multiplies_ssrgemm_nn_n, 64x128x8_32x32x1_8x4_4x8_2x4) using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1370,9 +1370,9 @@ TEST(SM50_device_maximum_multiplies_ssrgemm_nn_n, 64x256x8_32x64x1_8x8_4x8_2x4) using WarpShape = cutlass::gemm::GemmShape<32, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1406,9 +1406,9 @@ 
TEST(SM50_device_maximum_multiplies_ssrgemm_nn_n, 128x128x8_64x32x1_8x8_8x4_2x4) using WarpShape = cutlass::gemm::GemmShape<64, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1442,9 +1442,9 @@ TEST(SM50_device_maximum_multiplies_ssrgemm_nn_n, 32x32x8_8x16x1_2x2_4x8_4x2) { using WarpShape = cutlass::gemm::GemmShape<8, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1478,9 +1478,9 @@ TEST(SM50_device_maximum_multiplies_ssrgemm_nn_n, 64x32x8_16x16x1_4x2_4x8_4x2) { using WarpShape = cutlass::gemm::GemmShape<16, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1514,9 +1514,9 @@ 
TEST(SM50_device_maximum_multiplies_ssrgemm_nn_n, 64x64x8_16x32x1_4x4_4x8_4x2) { using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1550,9 +1550,9 @@ TEST(SM50_device_maximum_multiplies_ssrgemm_nn_n, 128x32x8_32x16x1_4x4_8x4_4x2) using WarpShape = cutlass::gemm::GemmShape<32, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1586,9 +1586,9 @@ TEST(SM50_device_maximum_multiplies_ssrgemm_nn_n, 128x64x8_32x32x1_8x4_4x8_4x2) using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1622,9 +1622,9 @@ 
TEST(SM50_device_maximum_multiplies_ssrgemm_nn_n, 128x128x8_32x64x1_8x8_4x8_4x2) using WarpShape = cutlass::gemm::GemmShape<32, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1658,9 +1658,9 @@ TEST(SM50_device_maximum_multiplies_ssrgemm_nn_n, 256x32x8_64x16x1_8x4_8x4_4x2) using WarpShape = cutlass::gemm::GemmShape<64, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1694,9 +1694,9 @@ TEST(SM50_device_maximum_multiplies_ssrgemm_nn_n, 256x64x8_64x32x1_8x8_8x4_4x2) using WarpShape = cutlass::gemm::GemmShape<64, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1730,9 +1730,9 @@ 
TEST(SM50_device_maximum_multiplies_ssrgemm_nn_n, 32x64x16_8x16x1_2x2_4x8_4x4) { using WarpShape = cutlass::gemm::GemmShape<8, 16, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1766,9 +1766,9 @@ TEST(SM50_device_maximum_multiplies_ssrgemm_nn_n, 32x128x16_8x32x1_2x4_4x8_4x4) using WarpShape = cutlass::gemm::GemmShape<8, 32, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1802,9 +1802,9 @@ TEST(SM50_device_maximum_multiplies_ssrgemm_nn_n, 64x32x16_16x8x1_2x2_8x4_4x4) { using WarpShape = cutlass::gemm::GemmShape<16, 8, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1838,9 +1838,9 @@ 
TEST(SM50_device_maximum_multiplies_ssrgemm_nn_n, 64x64x8_16x16x1_4x2_4x8_4x4) { using WarpShape = cutlass::gemm::GemmShape<16, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1874,9 +1874,9 @@ TEST(SM50_device_maximum_multiplies_ssrgemm_nn_n, 64x128x8_16x32x1_4x4_4x8_4x4) using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1910,9 +1910,9 @@ TEST(SM50_device_maximum_multiplies_ssrgemm_nn_n, 64x256x8_16x64x1_4x8_4x8_4x4) using WarpShape = cutlass::gemm::GemmShape<16, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1946,9 +1946,9 @@ 
TEST(SM50_device_maximum_multiplies_ssrgemm_nn_n, 128x32x16_32x8x1_4x2_8x4_4x4) using WarpShape = cutlass::gemm::GemmShape<32, 8, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1982,9 +1982,9 @@ TEST(SM50_device_maximum_multiplies_ssrgemm_nn_n, 128x64x8_32x16x1_4x4_8x4_4x4) using WarpShape = cutlass::gemm::GemmShape<32, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -2018,9 +2018,9 @@ TEST(SM50_device_maximum_multiplies_ssrgemm_nn_n, 128x128x8_32x32x1_8x4_4x8_4x4) using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -2054,9 +2054,9 @@ 
TEST(SM50_device_maximum_multiplies_ssrgemm_nn_n, 256x64x8_64x16x1_8x4_8x4_4x4) using WarpShape = cutlass::gemm::GemmShape<64, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; diff --git a/test/device/sm50_simt_maximum_multiplies_ssrgemm_nn_t.cu b/test/device/sm50_simt_maximum_multiplies_ssrgemm_nn_t.cu index 33f4052..4f5b298 100644 --- a/test/device/sm50_simt_maximum_multiplies_ssrgemm_nn_t.cu +++ b/test/device/sm50_simt_maximum_multiplies_ssrgemm_nn_t.cu @@ -38,9 +38,9 @@ TEST(SM50_device_maximum_multiplies_ssrgemm_nn_t, 8x32x8_8x32x1_2x4_4x8_1x1) { using WarpShape = cutlass::gemm::GemmShape<8, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -74,9 +74,9 @@ TEST(SM50_device_maximum_multiplies_ssrgemm_nn_t, 16x32x8_16x32x1_4x4_4x8_1x1) { using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename 
cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -110,9 +110,9 @@ TEST(SM50_device_maximum_multiplies_ssrgemm_nn_t, 16x64x8_16x64x1_4x8_4x8_1x1) { using WarpShape = cutlass::gemm::GemmShape<16, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -146,9 +146,9 @@ TEST(SM50_device_maximum_multiplies_ssrgemm_nn_t, 32x32x8_32x32x1_8x4_4x8_1x1) { using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -182,9 +182,9 @@ TEST(SM50_device_maximum_multiplies_ssrgemm_nn_t, 32x64x8_32x64x1_8x8_4x8_1x1) { using WarpShape = cutlass::gemm::GemmShape<32, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename 
cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -218,9 +218,9 @@ TEST(SM50_device_maximum_multiplies_ssrgemm_nn_t, 64x32x8_64x32x1_8x8_8x4_1x1) { using WarpShape = cutlass::gemm::GemmShape<64, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -254,9 +254,9 @@ TEST(SM50_device_maximum_multiplies_ssrgemm_nn_t, 8x32x8_8x16x1_2x2_4x8_1x2) { using WarpShape = cutlass::gemm::GemmShape<8, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -290,9 +290,9 @@ TEST(SM50_device_maximum_multiplies_ssrgemm_nn_t, 8x64x8_8x32x1_2x4_4x8_1x2) { using WarpShape = cutlass::gemm::GemmShape<8, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename 
cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -326,9 +326,9 @@ TEST(SM50_device_maximum_multiplies_ssrgemm_nn_t, 16x32x8_16x16x1_4x2_4x8_1x2) { using WarpShape = cutlass::gemm::GemmShape<16, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -362,9 +362,9 @@ TEST(SM50_device_maximum_multiplies_ssrgemm_nn_t, 16x64x8_16x32x1_4x4_4x8_1x2) { using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -398,9 +398,9 @@ TEST(SM50_device_maximum_multiplies_ssrgemm_nn_t, 16x128x8_16x64x1_4x8_4x8_1x2) using WarpShape = cutlass::gemm::GemmShape<16, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename 
cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -434,9 +434,9 @@ TEST(SM50_device_maximum_multiplies_ssrgemm_nn_t, 32x32x8_32x16x1_4x4_8x4_1x2) { using WarpShape = cutlass::gemm::GemmShape<32, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -470,9 +470,9 @@ TEST(SM50_device_maximum_multiplies_ssrgemm_nn_t, 32x64x8_32x32x1_8x4_4x8_1x2) { using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -506,9 +506,9 @@ TEST(SM50_device_maximum_multiplies_ssrgemm_nn_t, 32x128x8_32x64x1_8x8_4x8_1x2) using WarpShape = cutlass::gemm::GemmShape<32, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename 
cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -542,9 +542,9 @@ TEST(SM50_device_maximum_multiplies_ssrgemm_nn_t, 64x64x8_64x32x1_8x8_8x4_1x2) { using WarpShape = cutlass::gemm::GemmShape<64, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -578,9 +578,9 @@ TEST(SM50_device_maximum_multiplies_ssrgemm_nn_t, 32x32x8_16x32x1_4x4_4x8_2x1) { using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -614,9 +614,9 @@ TEST(SM50_device_maximum_multiplies_ssrgemm_nn_t, 64x32x8_32x32x1_8x4_4x8_2x1) { using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename 
cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -650,9 +650,9 @@ TEST(SM50_device_maximum_multiplies_ssrgemm_nn_t, 64x64x8_32x64x1_8x8_4x8_2x1) { using WarpShape = cutlass::gemm::GemmShape<32, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -686,9 +686,9 @@ TEST(SM50_device_maximum_multiplies_ssrgemm_nn_t, 128x32x8_64x32x1_8x8_8x4_2x1) using WarpShape = cutlass::gemm::GemmShape<64, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -722,9 +722,9 @@ TEST(SM50_device_maximum_multiplies_ssrgemm_nn_t, 16x32x8_8x16x1_2x2_4x8_2x2) { using WarpShape = cutlass::gemm::GemmShape<8, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename 
cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -758,9 +758,9 @@ TEST(SM50_device_maximum_multiplies_ssrgemm_nn_t, 16x64x8_8x32x1_2x4_4x8_2x2) { using WarpShape = cutlass::gemm::GemmShape<8, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -794,9 +794,9 @@ TEST(SM50_device_maximum_multiplies_ssrgemm_nn_t, 32x32x8_16x16x1_4x2_4x8_2x2) { using WarpShape = cutlass::gemm::GemmShape<16, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -830,9 +830,9 @@ TEST(SM50_device_maximum_multiplies_ssrgemm_nn_t, 32x64x8_16x32x1_4x4_4x8_2x2) { using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename 
cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -866,9 +866,9 @@ TEST(SM50_device_maximum_multiplies_ssrgemm_nn_t, 32x128x8_16x64x1_4x8_4x8_2x2) using WarpShape = cutlass::gemm::GemmShape<16, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -902,9 +902,9 @@ TEST(SM50_device_maximum_multiplies_ssrgemm_nn_t, 64x32x8_32x16x1_4x4_8x4_2x2) { using WarpShape = cutlass::gemm::GemmShape<32, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -938,9 +938,9 @@ TEST(SM50_device_maximum_multiplies_ssrgemm_nn_t, 64x64x8_32x32x1_8x4_4x8_2x2) { using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename 
cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -974,9 +974,9 @@ TEST(SM50_device_maximum_multiplies_ssrgemm_nn_t, 64x128x8_32x64x1_8x8_4x8_2x2) using WarpShape = cutlass::gemm::GemmShape<32, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1010,9 +1010,9 @@ TEST(SM50_device_maximum_multiplies_ssrgemm_nn_t, 128x32x8_64x16x1_8x4_8x4_2x2) using WarpShape = cutlass::gemm::GemmShape<64, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1046,9 +1046,9 @@ TEST(SM50_device_maximum_multiplies_ssrgemm_nn_t, 128x64x8_64x32x1_8x8_8x4_2x2) using WarpShape = cutlass::gemm::GemmShape<64, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename 
cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1082,9 +1082,9 @@ TEST(SM50_device_maximum_multiplies_ssrgemm_nn_t, 16x64x16_8x16x1_2x2_4x8_2x4) { using WarpShape = cutlass::gemm::GemmShape<8, 16, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1118,9 +1118,9 @@ TEST(SM50_device_maximum_multiplies_ssrgemm_nn_t, 16x128x16_8x32x1_2x4_4x8_2x4) using WarpShape = cutlass::gemm::GemmShape<8, 32, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1154,9 +1154,9 @@ TEST(SM50_device_maximum_multiplies_ssrgemm_nn_t, 32x32x8_16x8x1_2x2_8x4_2x4) { using WarpShape = cutlass::gemm::GemmShape<16, 8, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename 
cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1190,9 +1190,9 @@ TEST(SM50_device_maximum_multiplies_ssrgemm_nn_t, 32x64x8_16x16x1_4x2_4x8_2x4) { using WarpShape = cutlass::gemm::GemmShape<16, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1226,9 +1226,9 @@ TEST(SM50_device_maximum_multiplies_ssrgemm_nn_t, 32x128x8_16x32x1_4x4_4x8_2x4) using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1262,9 +1262,9 @@ TEST(SM50_device_maximum_multiplies_ssrgemm_nn_t, 32x256x8_16x64x1_4x8_4x8_2x4) using WarpShape = cutlass::gemm::GemmShape<16, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename 
cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1298,9 +1298,9 @@ TEST(SM50_device_maximum_multiplies_ssrgemm_nn_t, 64x64x8_32x16x1_4x4_8x4_2x4) { using WarpShape = cutlass::gemm::GemmShape<32, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1334,9 +1334,9 @@ TEST(SM50_device_maximum_multiplies_ssrgemm_nn_t, 64x128x8_32x32x1_8x4_4x8_2x4) using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1370,9 +1370,9 @@ TEST(SM50_device_maximum_multiplies_ssrgemm_nn_t, 64x256x8_32x64x1_8x8_4x8_2x4) using WarpShape = cutlass::gemm::GemmShape<32, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename 
cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1406,9 +1406,9 @@ TEST(SM50_device_maximum_multiplies_ssrgemm_nn_t, 128x128x8_64x32x1_8x8_8x4_2x4) using WarpShape = cutlass::gemm::GemmShape<64, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1442,9 +1442,9 @@ TEST(SM50_device_maximum_multiplies_ssrgemm_nn_t, 32x32x8_8x16x1_2x2_4x8_4x2) { using WarpShape = cutlass::gemm::GemmShape<8, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1478,9 +1478,9 @@ TEST(SM50_device_maximum_multiplies_ssrgemm_nn_t, 64x32x8_16x16x1_4x2_4x8_4x2) { using WarpShape = cutlass::gemm::GemmShape<16, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename 
cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1514,9 +1514,9 @@ TEST(SM50_device_maximum_multiplies_ssrgemm_nn_t, 64x64x8_16x32x1_4x4_4x8_4x2) { using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1550,9 +1550,9 @@ TEST(SM50_device_maximum_multiplies_ssrgemm_nn_t, 128x32x8_32x16x1_4x4_8x4_4x2) using WarpShape = cutlass::gemm::GemmShape<32, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1586,9 +1586,9 @@ TEST(SM50_device_maximum_multiplies_ssrgemm_nn_t, 128x64x8_32x32x1_8x4_4x8_4x2) using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename 
cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1622,9 +1622,9 @@ TEST(SM50_device_maximum_multiplies_ssrgemm_nn_t, 128x128x8_32x64x1_8x8_4x8_4x2) using WarpShape = cutlass::gemm::GemmShape<32, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1658,9 +1658,9 @@ TEST(SM50_device_maximum_multiplies_ssrgemm_nn_t, 256x32x8_64x16x1_8x4_8x4_4x2) using WarpShape = cutlass::gemm::GemmShape<64, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1694,9 +1694,9 @@ TEST(SM50_device_maximum_multiplies_ssrgemm_nn_t, 256x64x8_64x32x1_8x8_8x4_4x2) using WarpShape = cutlass::gemm::GemmShape<64, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename 
cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1730,9 +1730,9 @@ TEST(SM50_device_maximum_multiplies_ssrgemm_nn_t, 32x64x16_8x16x1_2x2_4x8_4x4) { using WarpShape = cutlass::gemm::GemmShape<8, 16, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1766,9 +1766,9 @@ TEST(SM50_device_maximum_multiplies_ssrgemm_nn_t, 32x128x16_8x32x1_2x4_4x8_4x4) using WarpShape = cutlass::gemm::GemmShape<8, 32, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1802,9 +1802,9 @@ TEST(SM50_device_maximum_multiplies_ssrgemm_nn_t, 64x32x16_16x8x1_2x2_8x4_4x4) { using WarpShape = cutlass::gemm::GemmShape<16, 8, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename 
cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1838,9 +1838,9 @@ TEST(SM50_device_maximum_multiplies_ssrgemm_nn_t, 64x64x8_16x16x1_4x2_4x8_4x4) { using WarpShape = cutlass::gemm::GemmShape<16, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1874,9 +1874,9 @@ TEST(SM50_device_maximum_multiplies_ssrgemm_nn_t, 64x128x8_16x32x1_4x4_4x8_4x4) using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1910,9 +1910,9 @@ TEST(SM50_device_maximum_multiplies_ssrgemm_nn_t, 64x256x8_16x64x1_4x8_4x8_4x4) using WarpShape = cutlass::gemm::GemmShape<16, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename 
cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1946,9 +1946,9 @@ TEST(SM50_device_maximum_multiplies_ssrgemm_nn_t, 128x32x16_32x8x1_4x2_8x4_4x4) using WarpShape = cutlass::gemm::GemmShape<32, 8, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1982,9 +1982,9 @@ TEST(SM50_device_maximum_multiplies_ssrgemm_nn_t, 128x64x8_32x16x1_4x4_8x4_4x4) using WarpShape = cutlass::gemm::GemmShape<32, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -2018,9 +2018,9 @@ TEST(SM50_device_maximum_multiplies_ssrgemm_nn_t, 128x128x8_32x32x1_8x4_4x8_4x4) using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename 
cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -2054,9 +2054,9 @@ TEST(SM50_device_maximum_multiplies_ssrgemm_nn_t, 256x64x8_64x16x1_8x4_8x4_4x4) using WarpShape = cutlass::gemm::GemmShape<64, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; diff --git a/test/device/sm50_simt_maximum_multiplies_ssrgemm_nt_n.cu b/test/device/sm50_simt_maximum_multiplies_ssrgemm_nt_n.cu index 61763eb..0cdf231 100644 --- a/test/device/sm50_simt_maximum_multiplies_ssrgemm_nt_n.cu +++ b/test/device/sm50_simt_maximum_multiplies_ssrgemm_nt_n.cu @@ -38,9 +38,9 @@ TEST(SM50_device_maximum_multiplies_ssrgemm_nt_n, 8x32x8_8x32x1_2x4_4x8_1x1) { using WarpShape = cutlass::gemm::GemmShape<8, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -74,9 +74,9 @@ TEST(SM50_device_maximum_multiplies_ssrgemm_nt_n, 16x32x8_16x32x1_4x4_4x8_1x1) { using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = 
cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -110,9 +110,9 @@ TEST(SM50_device_maximum_multiplies_ssrgemm_nt_n, 16x64x8_16x64x1_4x8_4x8_1x1) { using WarpShape = cutlass::gemm::GemmShape<16, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -146,9 +146,9 @@ TEST(SM50_device_maximum_multiplies_ssrgemm_nt_n, 32x32x8_32x32x1_8x4_4x8_1x1) { using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -182,9 +182,9 @@ TEST(SM50_device_maximum_multiplies_ssrgemm_nt_n, 32x64x8_32x64x1_8x8_4x8_1x1) { using WarpShape = cutlass::gemm::GemmShape<32, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - 
using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -218,9 +218,9 @@ TEST(SM50_device_maximum_multiplies_ssrgemm_nt_n, 64x32x8_64x32x1_8x8_8x4_1x1) { using WarpShape = cutlass::gemm::GemmShape<64, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -254,9 +254,9 @@ TEST(SM50_device_maximum_multiplies_ssrgemm_nt_n, 8x32x8_8x16x1_2x2_4x8_1x2) { using WarpShape = cutlass::gemm::GemmShape<8, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -290,9 +290,9 @@ TEST(SM50_device_maximum_multiplies_ssrgemm_nt_n, 8x64x8_8x32x1_2x4_4x8_1x2) { using WarpShape = cutlass::gemm::GemmShape<8, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename 
cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -326,9 +326,9 @@ TEST(SM50_device_maximum_multiplies_ssrgemm_nt_n, 16x32x8_16x16x1_4x2_4x8_1x2) { using WarpShape = cutlass::gemm::GemmShape<16, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -362,9 +362,9 @@ TEST(SM50_device_maximum_multiplies_ssrgemm_nt_n, 16x64x8_16x32x1_4x4_4x8_1x2) { using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -398,9 +398,9 @@ TEST(SM50_device_maximum_multiplies_ssrgemm_nt_n, 16x128x8_16x64x1_4x8_4x8_1x2) using WarpShape = cutlass::gemm::GemmShape<16, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename 
cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -434,9 +434,9 @@ TEST(SM50_device_maximum_multiplies_ssrgemm_nt_n, 32x32x8_32x16x1_4x4_8x4_1x2) { using WarpShape = cutlass::gemm::GemmShape<32, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -470,9 +470,9 @@ TEST(SM50_device_maximum_multiplies_ssrgemm_nt_n, 32x64x8_32x32x1_8x4_4x8_1x2) { using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -506,9 +506,9 @@ TEST(SM50_device_maximum_multiplies_ssrgemm_nt_n, 32x128x8_32x64x1_8x8_4x8_1x2) using WarpShape = cutlass::gemm::GemmShape<32, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename 
cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -542,9 +542,9 @@ TEST(SM50_device_maximum_multiplies_ssrgemm_nt_n, 64x64x8_64x32x1_8x8_8x4_1x2) { using WarpShape = cutlass::gemm::GemmShape<64, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -578,9 +578,9 @@ TEST(SM50_device_maximum_multiplies_ssrgemm_nt_n, 32x32x8_16x32x1_4x4_4x8_2x1) { using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -614,9 +614,9 @@ TEST(SM50_device_maximum_multiplies_ssrgemm_nt_n, 64x32x8_32x32x1_8x4_4x8_2x1) { using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename 
cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -650,9 +650,9 @@ TEST(SM50_device_maximum_multiplies_ssrgemm_nt_n, 64x64x8_32x64x1_8x8_4x8_2x1) { using WarpShape = cutlass::gemm::GemmShape<32, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -686,9 +686,9 @@ TEST(SM50_device_maximum_multiplies_ssrgemm_nt_n, 128x32x8_64x32x1_8x8_8x4_2x1) using WarpShape = cutlass::gemm::GemmShape<64, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -722,9 +722,9 @@ TEST(SM50_device_maximum_multiplies_ssrgemm_nt_n, 16x32x8_8x16x1_2x2_4x8_2x2) { using WarpShape = cutlass::gemm::GemmShape<8, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename 
cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -758,9 +758,9 @@ TEST(SM50_device_maximum_multiplies_ssrgemm_nt_n, 16x64x8_8x32x1_2x4_4x8_2x2) { using WarpShape = cutlass::gemm::GemmShape<8, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -794,9 +794,9 @@ TEST(SM50_device_maximum_multiplies_ssrgemm_nt_n, 32x32x8_16x16x1_4x2_4x8_2x2) { using WarpShape = cutlass::gemm::GemmShape<16, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -830,9 +830,9 @@ TEST(SM50_device_maximum_multiplies_ssrgemm_nt_n, 32x64x8_16x32x1_4x4_4x8_2x2) { using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename 
cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -866,9 +866,9 @@ TEST(SM50_device_maximum_multiplies_ssrgemm_nt_n, 32x128x8_16x64x1_4x8_4x8_2x2) using WarpShape = cutlass::gemm::GemmShape<16, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -902,9 +902,9 @@ TEST(SM50_device_maximum_multiplies_ssrgemm_nt_n, 64x32x8_32x16x1_4x4_8x4_2x2) { using WarpShape = cutlass::gemm::GemmShape<32, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -938,9 +938,9 @@ TEST(SM50_device_maximum_multiplies_ssrgemm_nt_n, 64x64x8_32x32x1_8x4_4x8_2x2) { using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename 
cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -974,9 +974,9 @@ TEST(SM50_device_maximum_multiplies_ssrgemm_nt_n, 64x128x8_32x64x1_8x8_4x8_2x2) using WarpShape = cutlass::gemm::GemmShape<32, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1010,9 +1010,9 @@ TEST(SM50_device_maximum_multiplies_ssrgemm_nt_n, 128x32x8_64x16x1_8x4_8x4_2x2) using WarpShape = cutlass::gemm::GemmShape<64, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1046,9 +1046,9 @@ TEST(SM50_device_maximum_multiplies_ssrgemm_nt_n, 128x64x8_64x32x1_8x8_8x4_2x2) using WarpShape = cutlass::gemm::GemmShape<64, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename 
cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1082,9 +1082,9 @@ TEST(SM50_device_maximum_multiplies_ssrgemm_nt_n, 16x64x16_8x16x1_2x2_4x8_2x4) { using WarpShape = cutlass::gemm::GemmShape<8, 16, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1118,9 +1118,9 @@ TEST(SM50_device_maximum_multiplies_ssrgemm_nt_n, 16x128x16_8x32x1_2x4_4x8_2x4) using WarpShape = cutlass::gemm::GemmShape<8, 32, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1154,9 +1154,9 @@ TEST(SM50_device_maximum_multiplies_ssrgemm_nt_n, 32x32x8_16x8x1_2x2_8x4_2x4) { using WarpShape = cutlass::gemm::GemmShape<16, 8, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename 
cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1190,9 +1190,9 @@ TEST(SM50_device_maximum_multiplies_ssrgemm_nt_n, 32x64x8_16x16x1_4x2_4x8_2x4) { using WarpShape = cutlass::gemm::GemmShape<16, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1226,9 +1226,9 @@ TEST(SM50_device_maximum_multiplies_ssrgemm_nt_n, 32x128x8_16x32x1_4x4_4x8_2x4) using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1262,9 +1262,9 @@ TEST(SM50_device_maximum_multiplies_ssrgemm_nt_n, 32x256x8_16x64x1_4x8_4x8_2x4) using WarpShape = cutlass::gemm::GemmShape<16, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename 
cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1298,9 +1298,9 @@ TEST(SM50_device_maximum_multiplies_ssrgemm_nt_n, 64x64x8_32x16x1_4x4_8x4_2x4) { using WarpShape = cutlass::gemm::GemmShape<32, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1334,9 +1334,9 @@ TEST(SM50_device_maximum_multiplies_ssrgemm_nt_n, 64x128x8_32x32x1_8x4_4x8_2x4) using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1370,9 +1370,9 @@ TEST(SM50_device_maximum_multiplies_ssrgemm_nt_n, 64x256x8_32x64x1_8x8_4x8_2x4) using WarpShape = cutlass::gemm::GemmShape<32, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename 
cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1406,9 +1406,9 @@ TEST(SM50_device_maximum_multiplies_ssrgemm_nt_n, 128x128x8_64x32x1_8x8_8x4_2x4) using WarpShape = cutlass::gemm::GemmShape<64, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1442,9 +1442,9 @@ TEST(SM50_device_maximum_multiplies_ssrgemm_nt_n, 32x32x8_8x16x1_2x2_4x8_4x2) { using WarpShape = cutlass::gemm::GemmShape<8, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1478,9 +1478,9 @@ TEST(SM50_device_maximum_multiplies_ssrgemm_nt_n, 64x32x8_16x16x1_4x2_4x8_4x2) { using WarpShape = cutlass::gemm::GemmShape<16, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename 
cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1514,9 +1514,9 @@ TEST(SM50_device_maximum_multiplies_ssrgemm_nt_n, 64x64x8_16x32x1_4x4_4x8_4x2) { using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1550,9 +1550,9 @@ TEST(SM50_device_maximum_multiplies_ssrgemm_nt_n, 128x32x8_32x16x1_4x4_8x4_4x2) using WarpShape = cutlass::gemm::GemmShape<32, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1586,9 +1586,9 @@ TEST(SM50_device_maximum_multiplies_ssrgemm_nt_n, 128x64x8_32x32x1_8x4_4x8_4x2) using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename 
cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1622,9 +1622,9 @@ TEST(SM50_device_maximum_multiplies_ssrgemm_nt_n, 128x128x8_32x64x1_8x8_4x8_4x2) using WarpShape = cutlass::gemm::GemmShape<32, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1658,9 +1658,9 @@ TEST(SM50_device_maximum_multiplies_ssrgemm_nt_n, 256x32x8_64x16x1_8x4_8x4_4x2) using WarpShape = cutlass::gemm::GemmShape<64, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1694,9 +1694,9 @@ TEST(SM50_device_maximum_multiplies_ssrgemm_nt_n, 256x64x8_64x32x1_8x8_8x4_4x2) using WarpShape = cutlass::gemm::GemmShape<64, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename 
cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1730,9 +1730,9 @@ TEST(SM50_device_maximum_multiplies_ssrgemm_nt_n, 32x64x16_8x16x1_2x2_4x8_4x4) { using WarpShape = cutlass::gemm::GemmShape<8, 16, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1766,9 +1766,9 @@ TEST(SM50_device_maximum_multiplies_ssrgemm_nt_n, 32x128x16_8x32x1_2x4_4x8_4x4) using WarpShape = cutlass::gemm::GemmShape<8, 32, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1802,9 +1802,9 @@ TEST(SM50_device_maximum_multiplies_ssrgemm_nt_n, 64x32x16_16x8x1_2x2_8x4_4x4) { using WarpShape = cutlass::gemm::GemmShape<16, 8, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename 
cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1838,9 +1838,9 @@ TEST(SM50_device_maximum_multiplies_ssrgemm_nt_n, 64x64x8_16x16x1_4x2_4x8_4x4) { using WarpShape = cutlass::gemm::GemmShape<16, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1874,9 +1874,9 @@ TEST(SM50_device_maximum_multiplies_ssrgemm_nt_n, 64x128x8_16x32x1_4x4_4x8_4x4) using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1910,9 +1910,9 @@ TEST(SM50_device_maximum_multiplies_ssrgemm_nt_n, 64x256x8_16x64x1_4x8_4x8_4x4) using WarpShape = cutlass::gemm::GemmShape<16, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename 
cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1946,9 +1946,9 @@ TEST(SM50_device_maximum_multiplies_ssrgemm_nt_n, 128x32x16_32x8x1_4x2_8x4_4x4) using WarpShape = cutlass::gemm::GemmShape<32, 8, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1982,9 +1982,9 @@ TEST(SM50_device_maximum_multiplies_ssrgemm_nt_n, 128x64x8_32x16x1_4x4_8x4_4x4) using WarpShape = cutlass::gemm::GemmShape<32, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -2018,9 +2018,9 @@ TEST(SM50_device_maximum_multiplies_ssrgemm_nt_n, 128x128x8_32x32x1_8x4_4x8_4x4) using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename 
cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -2054,9 +2054,9 @@ TEST(SM50_device_maximum_multiplies_ssrgemm_nt_n, 256x64x8_64x16x1_8x4_8x4_4x4) using WarpShape = cutlass::gemm::GemmShape<64, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; diff --git a/test/device/sm50_simt_maximum_multiplies_ssrgemm_nt_t.cu b/test/device/sm50_simt_maximum_multiplies_ssrgemm_nt_t.cu index 9de8d19..e8b08ed 100644 --- a/test/device/sm50_simt_maximum_multiplies_ssrgemm_nt_t.cu +++ b/test/device/sm50_simt_maximum_multiplies_ssrgemm_nt_t.cu @@ -38,9 +38,9 @@ TEST(SM50_device_maximum_multiplies_ssrgemm_nt_t, 8x32x8_8x32x1_2x4_4x8_1x1) { using WarpShape = cutlass::gemm::GemmShape<8, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; 
@@ -74,9 +74,9 @@ TEST(SM50_device_maximum_multiplies_ssrgemm_nt_t, 16x32x8_16x32x1_4x4_4x8_1x1) { using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -110,9 +110,9 @@ TEST(SM50_device_maximum_multiplies_ssrgemm_nt_t, 16x64x8_16x64x1_4x8_4x8_1x1) { using WarpShape = cutlass::gemm::GemmShape<16, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -146,9 +146,9 @@ TEST(SM50_device_maximum_multiplies_ssrgemm_nt_t, 32x32x8_32x32x1_8x4_4x8_1x1) { using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -182,9 +182,9 @@ 
TEST(SM50_device_maximum_multiplies_ssrgemm_nt_t, 32x64x8_32x64x1_8x8_4x8_1x1) { using WarpShape = cutlass::gemm::GemmShape<32, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -218,9 +218,9 @@ TEST(SM50_device_maximum_multiplies_ssrgemm_nt_t, 64x32x8_64x32x1_8x8_8x4_1x1) { using WarpShape = cutlass::gemm::GemmShape<64, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -254,9 +254,9 @@ TEST(SM50_device_maximum_multiplies_ssrgemm_nt_t, 8x32x8_8x16x1_2x2_4x8_1x2) { using WarpShape = cutlass::gemm::GemmShape<8, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -290,9 +290,9 @@ 
TEST(SM50_device_maximum_multiplies_ssrgemm_nt_t, 8x64x8_8x32x1_2x4_4x8_1x2) { using WarpShape = cutlass::gemm::GemmShape<8, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -326,9 +326,9 @@ TEST(SM50_device_maximum_multiplies_ssrgemm_nt_t, 16x32x8_16x16x1_4x2_4x8_1x2) { using WarpShape = cutlass::gemm::GemmShape<16, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -362,9 +362,9 @@ TEST(SM50_device_maximum_multiplies_ssrgemm_nt_t, 16x64x8_16x32x1_4x4_4x8_1x2) { using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -398,9 +398,9 @@ 
TEST(SM50_device_maximum_multiplies_ssrgemm_nt_t, 16x128x8_16x64x1_4x8_4x8_1x2) using WarpShape = cutlass::gemm::GemmShape<16, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -434,9 +434,9 @@ TEST(SM50_device_maximum_multiplies_ssrgemm_nt_t, 32x32x8_32x16x1_4x4_8x4_1x2) { using WarpShape = cutlass::gemm::GemmShape<32, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -470,9 +470,9 @@ TEST(SM50_device_maximum_multiplies_ssrgemm_nt_t, 32x64x8_32x32x1_8x4_4x8_1x2) { using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -506,9 +506,9 @@ 
TEST(SM50_device_maximum_multiplies_ssrgemm_nt_t, 32x128x8_32x64x1_8x8_4x8_1x2) using WarpShape = cutlass::gemm::GemmShape<32, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -542,9 +542,9 @@ TEST(SM50_device_maximum_multiplies_ssrgemm_nt_t, 64x64x8_64x32x1_8x8_8x4_1x2) { using WarpShape = cutlass::gemm::GemmShape<64, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -578,9 +578,9 @@ TEST(SM50_device_maximum_multiplies_ssrgemm_nt_t, 32x32x8_16x32x1_4x4_4x8_2x1) { using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -614,9 +614,9 @@ 
TEST(SM50_device_maximum_multiplies_ssrgemm_nt_t, 64x32x8_32x32x1_8x4_4x8_2x1) { using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -650,9 +650,9 @@ TEST(SM50_device_maximum_multiplies_ssrgemm_nt_t, 64x64x8_32x64x1_8x8_4x8_2x1) { using WarpShape = cutlass::gemm::GemmShape<32, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -686,9 +686,9 @@ TEST(SM50_device_maximum_multiplies_ssrgemm_nt_t, 128x32x8_64x32x1_8x8_8x4_2x1) using WarpShape = cutlass::gemm::GemmShape<64, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -722,9 +722,9 @@ 
TEST(SM50_device_maximum_multiplies_ssrgemm_nt_t, 16x32x8_8x16x1_2x2_4x8_2x2) { using WarpShape = cutlass::gemm::GemmShape<8, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -758,9 +758,9 @@ TEST(SM50_device_maximum_multiplies_ssrgemm_nt_t, 16x64x8_8x32x1_2x4_4x8_2x2) { using WarpShape = cutlass::gemm::GemmShape<8, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -794,9 +794,9 @@ TEST(SM50_device_maximum_multiplies_ssrgemm_nt_t, 32x32x8_16x16x1_4x2_4x8_2x2) { using WarpShape = cutlass::gemm::GemmShape<16, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -830,9 +830,9 @@ 
TEST(SM50_device_maximum_multiplies_ssrgemm_nt_t, 32x64x8_16x32x1_4x4_4x8_2x2) { using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -866,9 +866,9 @@ TEST(SM50_device_maximum_multiplies_ssrgemm_nt_t, 32x128x8_16x64x1_4x8_4x8_2x2) using WarpShape = cutlass::gemm::GemmShape<16, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -902,9 +902,9 @@ TEST(SM50_device_maximum_multiplies_ssrgemm_nt_t, 64x32x8_32x16x1_4x4_8x4_2x2) { using WarpShape = cutlass::gemm::GemmShape<32, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -938,9 +938,9 @@ 
TEST(SM50_device_maximum_multiplies_ssrgemm_nt_t, 64x64x8_32x32x1_8x4_4x8_2x2) { using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -974,9 +974,9 @@ TEST(SM50_device_maximum_multiplies_ssrgemm_nt_t, 64x128x8_32x64x1_8x8_4x8_2x2) using WarpShape = cutlass::gemm::GemmShape<32, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1010,9 +1010,9 @@ TEST(SM50_device_maximum_multiplies_ssrgemm_nt_t, 128x32x8_64x16x1_8x4_8x4_2x2) using WarpShape = cutlass::gemm::GemmShape<64, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1046,9 +1046,9 @@ 
TEST(SM50_device_maximum_multiplies_ssrgemm_nt_t, 128x64x8_64x32x1_8x8_8x4_2x2) using WarpShape = cutlass::gemm::GemmShape<64, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1082,9 +1082,9 @@ TEST(SM50_device_maximum_multiplies_ssrgemm_nt_t, 16x64x16_8x16x1_2x2_4x8_2x4) { using WarpShape = cutlass::gemm::GemmShape<8, 16, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1118,9 +1118,9 @@ TEST(SM50_device_maximum_multiplies_ssrgemm_nt_t, 16x128x16_8x32x1_2x4_4x8_2x4) using WarpShape = cutlass::gemm::GemmShape<8, 32, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1154,9 +1154,9 @@ 
TEST(SM50_device_maximum_multiplies_ssrgemm_nt_t, 32x32x8_16x8x1_2x2_8x4_2x4) { using WarpShape = cutlass::gemm::GemmShape<16, 8, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1190,9 +1190,9 @@ TEST(SM50_device_maximum_multiplies_ssrgemm_nt_t, 32x64x8_16x16x1_4x2_4x8_2x4) { using WarpShape = cutlass::gemm::GemmShape<16, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1226,9 +1226,9 @@ TEST(SM50_device_maximum_multiplies_ssrgemm_nt_t, 32x128x8_16x32x1_4x4_4x8_2x4) using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1262,9 +1262,9 @@ 
TEST(SM50_device_maximum_multiplies_ssrgemm_nt_t, 32x256x8_16x64x1_4x8_4x8_2x4) using WarpShape = cutlass::gemm::GemmShape<16, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1298,9 +1298,9 @@ TEST(SM50_device_maximum_multiplies_ssrgemm_nt_t, 64x64x8_32x16x1_4x4_8x4_2x4) { using WarpShape = cutlass::gemm::GemmShape<32, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1334,9 +1334,9 @@ TEST(SM50_device_maximum_multiplies_ssrgemm_nt_t, 64x128x8_32x32x1_8x4_4x8_2x4) using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1370,9 +1370,9 @@ 
TEST(SM50_device_maximum_multiplies_ssrgemm_nt_t, 64x256x8_32x64x1_8x8_4x8_2x4) using WarpShape = cutlass::gemm::GemmShape<32, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1406,9 +1406,9 @@ TEST(SM50_device_maximum_multiplies_ssrgemm_nt_t, 128x128x8_64x32x1_8x8_8x4_2x4) using WarpShape = cutlass::gemm::GemmShape<64, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1442,9 +1442,9 @@ TEST(SM50_device_maximum_multiplies_ssrgemm_nt_t, 32x32x8_8x16x1_2x2_4x8_4x2) { using WarpShape = cutlass::gemm::GemmShape<8, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1478,9 +1478,9 @@ 
TEST(SM50_device_maximum_multiplies_ssrgemm_nt_t, 64x32x8_16x16x1_4x2_4x8_4x2) { using WarpShape = cutlass::gemm::GemmShape<16, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1514,9 +1514,9 @@ TEST(SM50_device_maximum_multiplies_ssrgemm_nt_t, 64x64x8_16x32x1_4x4_4x8_4x2) { using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1550,9 +1550,9 @@ TEST(SM50_device_maximum_multiplies_ssrgemm_nt_t, 128x32x8_32x16x1_4x4_8x4_4x2) using WarpShape = cutlass::gemm::GemmShape<32, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1586,9 +1586,9 @@ 
TEST(SM50_device_maximum_multiplies_ssrgemm_nt_t, 128x64x8_32x32x1_8x4_4x8_4x2) using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1622,9 +1622,9 @@ TEST(SM50_device_maximum_multiplies_ssrgemm_nt_t, 128x128x8_32x64x1_8x8_4x8_4x2) using WarpShape = cutlass::gemm::GemmShape<32, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1658,9 +1658,9 @@ TEST(SM50_device_maximum_multiplies_ssrgemm_nt_t, 256x32x8_64x16x1_8x4_8x4_4x2) using WarpShape = cutlass::gemm::GemmShape<64, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1694,9 +1694,9 @@ 
TEST(SM50_device_maximum_multiplies_ssrgemm_nt_t, 256x64x8_64x32x1_8x8_8x4_4x2) using WarpShape = cutlass::gemm::GemmShape<64, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1730,9 +1730,9 @@ TEST(SM50_device_maximum_multiplies_ssrgemm_nt_t, 32x64x16_8x16x1_2x2_4x8_4x4) { using WarpShape = cutlass::gemm::GemmShape<8, 16, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1766,9 +1766,9 @@ TEST(SM50_device_maximum_multiplies_ssrgemm_nt_t, 32x128x16_8x32x1_2x4_4x8_4x4) using WarpShape = cutlass::gemm::GemmShape<8, 32, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1802,9 +1802,9 @@ 
TEST(SM50_device_maximum_multiplies_ssrgemm_nt_t, 64x32x16_16x8x1_2x2_8x4_4x4) { using WarpShape = cutlass::gemm::GemmShape<16, 8, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1838,9 +1838,9 @@ TEST(SM50_device_maximum_multiplies_ssrgemm_nt_t, 64x64x8_16x16x1_4x2_4x8_4x4) { using WarpShape = cutlass::gemm::GemmShape<16, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1874,9 +1874,9 @@ TEST(SM50_device_maximum_multiplies_ssrgemm_nt_t, 64x128x8_16x32x1_4x4_4x8_4x4) using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1910,9 +1910,9 @@ 
TEST(SM50_device_maximum_multiplies_ssrgemm_nt_t, 64x256x8_16x64x1_4x8_4x8_4x4) using WarpShape = cutlass::gemm::GemmShape<16, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1946,9 +1946,9 @@ TEST(SM50_device_maximum_multiplies_ssrgemm_nt_t, 128x32x16_32x8x1_4x2_8x4_4x4) using WarpShape = cutlass::gemm::GemmShape<32, 8, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1982,9 +1982,9 @@ TEST(SM50_device_maximum_multiplies_ssrgemm_nt_t, 128x64x8_32x16x1_4x4_8x4_4x4) using WarpShape = cutlass::gemm::GemmShape<32, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -2018,9 +2018,9 @@ 
TEST(SM50_device_maximum_multiplies_ssrgemm_nt_t, 128x128x8_32x32x1_8x4_4x8_4x4) using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -2054,9 +2054,9 @@ TEST(SM50_device_maximum_multiplies_ssrgemm_nt_t, 256x64x8_64x16x1_8x4_8x4_4x4) using WarpShape = cutlass::gemm::GemmShape<64, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; diff --git a/test/device/sm50_simt_maximum_multiplies_ssrgemm_tn_n.cu b/test/device/sm50_simt_maximum_multiplies_ssrgemm_tn_n.cu index b79d773..7d7f40a 100644 --- a/test/device/sm50_simt_maximum_multiplies_ssrgemm_tn_n.cu +++ b/test/device/sm50_simt_maximum_multiplies_ssrgemm_tn_n.cu @@ -38,9 +38,9 @@ TEST(SM50_device_maximum_multiplies_ssrgemm_tn_n, 8x32x8_8x32x1_2x4_4x8_1x1) { using WarpShape = cutlass::gemm::GemmShape<8, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename 
cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -74,9 +74,9 @@ TEST(SM50_device_maximum_multiplies_ssrgemm_tn_n, 16x32x8_16x32x1_4x4_4x8_1x1) { using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -110,9 +110,9 @@ TEST(SM50_device_maximum_multiplies_ssrgemm_tn_n, 16x64x8_16x64x1_4x8_4x8_1x1) { using WarpShape = cutlass::gemm::GemmShape<16, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -146,9 +146,9 @@ TEST(SM50_device_maximum_multiplies_ssrgemm_tn_n, 32x32x8_32x32x1_8x4_4x8_1x1) { using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename 
cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -182,9 +182,9 @@ TEST(SM50_device_maximum_multiplies_ssrgemm_tn_n, 32x64x8_32x64x1_8x8_4x8_1x1) { using WarpShape = cutlass::gemm::GemmShape<32, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -218,9 +218,9 @@ TEST(SM50_device_maximum_multiplies_ssrgemm_tn_n, 64x32x8_64x32x1_8x8_8x4_1x1) { using WarpShape = cutlass::gemm::GemmShape<64, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -254,9 +254,9 @@ TEST(SM50_device_maximum_multiplies_ssrgemm_tn_n, 8x32x8_8x16x1_2x2_4x8_1x2) { using WarpShape = cutlass::gemm::GemmShape<8, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename 
cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -290,9 +290,9 @@ TEST(SM50_device_maximum_multiplies_ssrgemm_tn_n, 8x64x8_8x32x1_2x4_4x8_1x2) { using WarpShape = cutlass::gemm::GemmShape<8, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -326,9 +326,9 @@ TEST(SM50_device_maximum_multiplies_ssrgemm_tn_n, 16x32x8_16x16x1_4x2_4x8_1x2) { using WarpShape = cutlass::gemm::GemmShape<16, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -362,9 +362,9 @@ TEST(SM50_device_maximum_multiplies_ssrgemm_tn_n, 16x64x8_16x32x1_4x4_4x8_1x2) { using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename 
cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -398,9 +398,9 @@ TEST(SM50_device_maximum_multiplies_ssrgemm_tn_n, 16x128x8_16x64x1_4x8_4x8_1x2) using WarpShape = cutlass::gemm::GemmShape<16, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -434,9 +434,9 @@ TEST(SM50_device_maximum_multiplies_ssrgemm_tn_n, 32x32x8_32x16x1_4x4_8x4_1x2) { using WarpShape = cutlass::gemm::GemmShape<32, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -470,9 +470,9 @@ TEST(SM50_device_maximum_multiplies_ssrgemm_tn_n, 32x64x8_32x32x1_8x4_4x8_1x2) { using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename 
cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -506,9 +506,9 @@ TEST(SM50_device_maximum_multiplies_ssrgemm_tn_n, 32x128x8_32x64x1_8x8_4x8_1x2) using WarpShape = cutlass::gemm::GemmShape<32, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -542,9 +542,9 @@ TEST(SM50_device_maximum_multiplies_ssrgemm_tn_n, 64x64x8_64x32x1_8x8_8x4_1x2) { using WarpShape = cutlass::gemm::GemmShape<64, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -578,9 +578,9 @@ TEST(SM50_device_maximum_multiplies_ssrgemm_tn_n, 32x32x8_16x32x1_4x4_4x8_2x1) { using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename 
cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -614,9 +614,9 @@ TEST(SM50_device_maximum_multiplies_ssrgemm_tn_n, 64x32x8_32x32x1_8x4_4x8_2x1) { using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -650,9 +650,9 @@ TEST(SM50_device_maximum_multiplies_ssrgemm_tn_n, 64x64x8_32x64x1_8x8_4x8_2x1) { using WarpShape = cutlass::gemm::GemmShape<32, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -686,9 +686,9 @@ TEST(SM50_device_maximum_multiplies_ssrgemm_tn_n, 128x32x8_64x32x1_8x8_8x4_2x1) using WarpShape = cutlass::gemm::GemmShape<64, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename 
cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -722,9 +722,9 @@ TEST(SM50_device_maximum_multiplies_ssrgemm_tn_n, 16x32x8_8x16x1_2x2_4x8_2x2) { using WarpShape = cutlass::gemm::GemmShape<8, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -758,9 +758,9 @@ TEST(SM50_device_maximum_multiplies_ssrgemm_tn_n, 16x64x8_8x32x1_2x4_4x8_2x2) { using WarpShape = cutlass::gemm::GemmShape<8, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -794,9 +794,9 @@ TEST(SM50_device_maximum_multiplies_ssrgemm_tn_n, 32x32x8_16x16x1_4x2_4x8_2x2) { using WarpShape = cutlass::gemm::GemmShape<16, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename 
cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -830,9 +830,9 @@ TEST(SM50_device_maximum_multiplies_ssrgemm_tn_n, 32x64x8_16x32x1_4x4_4x8_2x2) { using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -866,9 +866,9 @@ TEST(SM50_device_maximum_multiplies_ssrgemm_tn_n, 32x128x8_16x64x1_4x8_4x8_2x2) using WarpShape = cutlass::gemm::GemmShape<16, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -902,9 +902,9 @@ TEST(SM50_device_maximum_multiplies_ssrgemm_tn_n, 64x32x8_32x16x1_4x4_8x4_2x2) { using WarpShape = cutlass::gemm::GemmShape<32, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename 
cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -938,9 +938,9 @@ TEST(SM50_device_maximum_multiplies_ssrgemm_tn_n, 64x64x8_32x32x1_8x4_4x8_2x2) { using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -974,9 +974,9 @@ TEST(SM50_device_maximum_multiplies_ssrgemm_tn_n, 64x128x8_32x64x1_8x8_4x8_2x2) using WarpShape = cutlass::gemm::GemmShape<32, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1010,9 +1010,9 @@ TEST(SM50_device_maximum_multiplies_ssrgemm_tn_n, 128x32x8_64x16x1_8x4_8x4_2x2) using WarpShape = cutlass::gemm::GemmShape<64, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename 
cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1046,9 +1046,9 @@ TEST(SM50_device_maximum_multiplies_ssrgemm_tn_n, 128x64x8_64x32x1_8x8_8x4_2x2) using WarpShape = cutlass::gemm::GemmShape<64, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1082,9 +1082,9 @@ TEST(SM50_device_maximum_multiplies_ssrgemm_tn_n, 16x64x16_8x16x1_2x2_4x8_2x4) { using WarpShape = cutlass::gemm::GemmShape<8, 16, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1118,9 +1118,9 @@ TEST(SM50_device_maximum_multiplies_ssrgemm_tn_n, 16x128x16_8x32x1_2x4_4x8_2x4) using WarpShape = cutlass::gemm::GemmShape<8, 32, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename 
cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1154,9 +1154,9 @@ TEST(SM50_device_maximum_multiplies_ssrgemm_tn_n, 32x32x8_16x8x1_2x2_8x4_2x4) { using WarpShape = cutlass::gemm::GemmShape<16, 8, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1190,9 +1190,9 @@ TEST(SM50_device_maximum_multiplies_ssrgemm_tn_n, 32x64x8_16x16x1_4x2_4x8_2x4) { using WarpShape = cutlass::gemm::GemmShape<16, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1226,9 +1226,9 @@ TEST(SM50_device_maximum_multiplies_ssrgemm_tn_n, 32x128x8_16x32x1_4x4_4x8_2x4) using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename 
cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1262,9 +1262,9 @@ TEST(SM50_device_maximum_multiplies_ssrgemm_tn_n, 32x256x8_16x64x1_4x8_4x8_2x4) using WarpShape = cutlass::gemm::GemmShape<16, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1298,9 +1298,9 @@ TEST(SM50_device_maximum_multiplies_ssrgemm_tn_n, 64x64x8_32x16x1_4x4_8x4_2x4) { using WarpShape = cutlass::gemm::GemmShape<32, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1334,9 +1334,9 @@ TEST(SM50_device_maximum_multiplies_ssrgemm_tn_n, 64x128x8_32x32x1_8x4_4x8_2x4) using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename 
cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1370,9 +1370,9 @@ TEST(SM50_device_maximum_multiplies_ssrgemm_tn_n, 64x256x8_32x64x1_8x8_4x8_2x4) using WarpShape = cutlass::gemm::GemmShape<32, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1406,9 +1406,9 @@ TEST(SM50_device_maximum_multiplies_ssrgemm_tn_n, 128x128x8_64x32x1_8x8_8x4_2x4) using WarpShape = cutlass::gemm::GemmShape<64, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1442,9 +1442,9 @@ TEST(SM50_device_maximum_multiplies_ssrgemm_tn_n, 32x32x8_8x16x1_2x2_4x8_4x2) { using WarpShape = cutlass::gemm::GemmShape<8, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename 
cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1478,9 +1478,9 @@ TEST(SM50_device_maximum_multiplies_ssrgemm_tn_n, 64x32x8_16x16x1_4x2_4x8_4x2) { using WarpShape = cutlass::gemm::GemmShape<16, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1514,9 +1514,9 @@ TEST(SM50_device_maximum_multiplies_ssrgemm_tn_n, 64x64x8_16x32x1_4x4_4x8_4x2) { using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1550,9 +1550,9 @@ TEST(SM50_device_maximum_multiplies_ssrgemm_tn_n, 128x32x8_32x16x1_4x4_8x4_4x2) using WarpShape = cutlass::gemm::GemmShape<32, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename 
cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1586,9 +1586,9 @@ TEST(SM50_device_maximum_multiplies_ssrgemm_tn_n, 128x64x8_32x32x1_8x4_4x8_4x2) using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1622,9 +1622,9 @@ TEST(SM50_device_maximum_multiplies_ssrgemm_tn_n, 128x128x8_32x64x1_8x8_4x8_4x2) using WarpShape = cutlass::gemm::GemmShape<32, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1658,9 +1658,9 @@ TEST(SM50_device_maximum_multiplies_ssrgemm_tn_n, 256x32x8_64x16x1_8x4_8x4_4x2) using WarpShape = cutlass::gemm::GemmShape<64, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename 
cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1694,9 +1694,9 @@ TEST(SM50_device_maximum_multiplies_ssrgemm_tn_n, 256x64x8_64x32x1_8x8_8x4_4x2) using WarpShape = cutlass::gemm::GemmShape<64, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1730,9 +1730,9 @@ TEST(SM50_device_maximum_multiplies_ssrgemm_tn_n, 32x64x16_8x16x1_2x2_4x8_4x4) { using WarpShape = cutlass::gemm::GemmShape<8, 16, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1766,9 +1766,9 @@ TEST(SM50_device_maximum_multiplies_ssrgemm_tn_n, 32x128x16_8x32x1_2x4_4x8_4x4) using WarpShape = cutlass::gemm::GemmShape<8, 32, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename 
cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1802,9 +1802,9 @@ TEST(SM50_device_maximum_multiplies_ssrgemm_tn_n, 64x32x16_16x8x1_2x2_8x4_4x4) { using WarpShape = cutlass::gemm::GemmShape<16, 8, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1838,9 +1838,9 @@ TEST(SM50_device_maximum_multiplies_ssrgemm_tn_n, 64x64x8_16x16x1_4x2_4x8_4x4) { using WarpShape = cutlass::gemm::GemmShape<16, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1874,9 +1874,9 @@ TEST(SM50_device_maximum_multiplies_ssrgemm_tn_n, 64x128x8_16x32x1_4x4_4x8_4x4) using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename 
cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1910,9 +1910,9 @@ TEST(SM50_device_maximum_multiplies_ssrgemm_tn_n, 64x256x8_16x64x1_4x8_4x8_4x4) using WarpShape = cutlass::gemm::GemmShape<16, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1946,9 +1946,9 @@ TEST(SM50_device_maximum_multiplies_ssrgemm_tn_n, 128x32x16_32x8x1_4x2_8x4_4x4) using WarpShape = cutlass::gemm::GemmShape<32, 8, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1982,9 +1982,9 @@ TEST(SM50_device_maximum_multiplies_ssrgemm_tn_n, 128x64x8_32x16x1_4x4_8x4_4x4) using WarpShape = cutlass::gemm::GemmShape<32, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename 
cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -2018,9 +2018,9 @@ TEST(SM50_device_maximum_multiplies_ssrgemm_tn_n, 128x128x8_32x32x1_8x4_4x8_4x4) using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -2054,9 +2054,9 @@ TEST(SM50_device_maximum_multiplies_ssrgemm_tn_n, 256x64x8_64x16x1_8x4_8x4_4x4) using WarpShape = cutlass::gemm::GemmShape<64, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; diff --git a/test/device/sm50_simt_maximum_multiplies_ssrgemm_tn_t.cu b/test/device/sm50_simt_maximum_multiplies_ssrgemm_tn_t.cu index 0b0de63..715df12 100644 --- a/test/device/sm50_simt_maximum_multiplies_ssrgemm_tn_t.cu +++ b/test/device/sm50_simt_maximum_multiplies_ssrgemm_tn_t.cu @@ -38,9 +38,9 @@ TEST(SM50_device_maximum_multiplies_ssrgemm_tn_t, 8x32x8_8x32x1_2x4_4x8_1x1) { using WarpShape = cutlass::gemm::GemmShape<8, 32, 8>; using InstructionShape = 
cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -74,9 +74,9 @@ TEST(SM50_device_maximum_multiplies_ssrgemm_tn_t, 16x32x8_16x32x1_4x4_4x8_1x1) { using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -110,9 +110,9 @@ TEST(SM50_device_maximum_multiplies_ssrgemm_tn_t, 16x64x8_16x64x1_4x8_4x8_1x1) { using WarpShape = cutlass::gemm::GemmShape<16, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -146,9 +146,9 @@ TEST(SM50_device_maximum_multiplies_ssrgemm_tn_t, 32x32x8_32x32x1_8x4_4x8_1x1) { using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using 
Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -182,9 +182,9 @@ TEST(SM50_device_maximum_multiplies_ssrgemm_tn_t, 32x64x8_32x64x1_8x8_4x8_1x1) { using WarpShape = cutlass::gemm::GemmShape<32, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -218,9 +218,9 @@ TEST(SM50_device_maximum_multiplies_ssrgemm_tn_t, 64x32x8_64x32x1_8x8_8x4_1x1) { using WarpShape = cutlass::gemm::GemmShape<64, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -254,9 +254,9 @@ TEST(SM50_device_maximum_multiplies_ssrgemm_tn_t, 8x32x8_8x16x1_2x2_4x8_1x2) { using WarpShape = cutlass::gemm::GemmShape<8, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename 
cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -290,9 +290,9 @@ TEST(SM50_device_maximum_multiplies_ssrgemm_tn_t, 8x64x8_8x32x1_2x4_4x8_1x2) { using WarpShape = cutlass::gemm::GemmShape<8, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -326,9 +326,9 @@ TEST(SM50_device_maximum_multiplies_ssrgemm_tn_t, 16x32x8_16x16x1_4x2_4x8_1x2) { using WarpShape = cutlass::gemm::GemmShape<16, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -362,9 +362,9 @@ TEST(SM50_device_maximum_multiplies_ssrgemm_tn_t, 16x64x8_16x32x1_4x4_4x8_1x2) { using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename 
cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -398,9 +398,9 @@ TEST(SM50_device_maximum_multiplies_ssrgemm_tn_t, 16x128x8_16x64x1_4x8_4x8_1x2) using WarpShape = cutlass::gemm::GemmShape<16, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -434,9 +434,9 @@ TEST(SM50_device_maximum_multiplies_ssrgemm_tn_t, 32x32x8_32x16x1_4x4_8x4_1x2) { using WarpShape = cutlass::gemm::GemmShape<32, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -470,9 +470,9 @@ TEST(SM50_device_maximum_multiplies_ssrgemm_tn_t, 32x64x8_32x32x1_8x4_4x8_1x2) { using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename 
cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -506,9 +506,9 @@ TEST(SM50_device_maximum_multiplies_ssrgemm_tn_t, 32x128x8_32x64x1_8x8_4x8_1x2) using WarpShape = cutlass::gemm::GemmShape<32, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -542,9 +542,9 @@ TEST(SM50_device_maximum_multiplies_ssrgemm_tn_t, 64x64x8_64x32x1_8x8_8x4_1x2) { using WarpShape = cutlass::gemm::GemmShape<64, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -578,9 +578,9 @@ TEST(SM50_device_maximum_multiplies_ssrgemm_tn_t, 32x32x8_16x32x1_4x4_4x8_2x1) { using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename 
cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -614,9 +614,9 @@ TEST(SM50_device_maximum_multiplies_ssrgemm_tn_t, 64x32x8_32x32x1_8x4_4x8_2x1) { using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -650,9 +650,9 @@ TEST(SM50_device_maximum_multiplies_ssrgemm_tn_t, 64x64x8_32x64x1_8x8_4x8_2x1) { using WarpShape = cutlass::gemm::GemmShape<32, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -686,9 +686,9 @@ TEST(SM50_device_maximum_multiplies_ssrgemm_tn_t, 128x32x8_64x32x1_8x8_8x4_2x1) using WarpShape = cutlass::gemm::GemmShape<64, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename 
cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -722,9 +722,9 @@ TEST(SM50_device_maximum_multiplies_ssrgemm_tn_t, 16x32x8_8x16x1_2x2_4x8_2x2) { using WarpShape = cutlass::gemm::GemmShape<8, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -758,9 +758,9 @@ TEST(SM50_device_maximum_multiplies_ssrgemm_tn_t, 16x64x8_8x32x1_2x4_4x8_2x2) { using WarpShape = cutlass::gemm::GemmShape<8, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -794,9 +794,9 @@ TEST(SM50_device_maximum_multiplies_ssrgemm_tn_t, 32x32x8_16x16x1_4x2_4x8_2x2) { using WarpShape = cutlass::gemm::GemmShape<16, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename 
cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -830,9 +830,9 @@ TEST(SM50_device_maximum_multiplies_ssrgemm_tn_t, 32x64x8_16x32x1_4x4_4x8_2x2) { using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -866,9 +866,9 @@ TEST(SM50_device_maximum_multiplies_ssrgemm_tn_t, 32x128x8_16x64x1_4x8_4x8_2x2) using WarpShape = cutlass::gemm::GemmShape<16, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -902,9 +902,9 @@ TEST(SM50_device_maximum_multiplies_ssrgemm_tn_t, 64x32x8_32x16x1_4x4_8x4_2x2) { using WarpShape = cutlass::gemm::GemmShape<32, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename 
cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -938,9 +938,9 @@ TEST(SM50_device_maximum_multiplies_ssrgemm_tn_t, 64x64x8_32x32x1_8x4_4x8_2x2) { using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -974,9 +974,9 @@ TEST(SM50_device_maximum_multiplies_ssrgemm_tn_t, 64x128x8_32x64x1_8x8_4x8_2x2) using WarpShape = cutlass::gemm::GemmShape<32, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1010,9 +1010,9 @@ TEST(SM50_device_maximum_multiplies_ssrgemm_tn_t, 128x32x8_64x16x1_8x4_8x4_2x2) using WarpShape = cutlass::gemm::GemmShape<64, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename 
cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1046,9 +1046,9 @@ TEST(SM50_device_maximum_multiplies_ssrgemm_tn_t, 128x64x8_64x32x1_8x8_8x4_2x2) using WarpShape = cutlass::gemm::GemmShape<64, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1082,9 +1082,9 @@ TEST(SM50_device_maximum_multiplies_ssrgemm_tn_t, 16x64x16_8x16x1_2x2_4x8_2x4) { using WarpShape = cutlass::gemm::GemmShape<8, 16, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1118,9 +1118,9 @@ TEST(SM50_device_maximum_multiplies_ssrgemm_tn_t, 16x128x16_8x32x1_2x4_4x8_2x4) using WarpShape = cutlass::gemm::GemmShape<8, 32, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename 
cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1154,9 +1154,9 @@ TEST(SM50_device_maximum_multiplies_ssrgemm_tn_t, 32x32x8_16x8x1_2x2_8x4_2x4) { using WarpShape = cutlass::gemm::GemmShape<16, 8, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1190,9 +1190,9 @@ TEST(SM50_device_maximum_multiplies_ssrgemm_tn_t, 32x64x8_16x16x1_4x2_4x8_2x4) { using WarpShape = cutlass::gemm::GemmShape<16, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1226,9 +1226,9 @@ TEST(SM50_device_maximum_multiplies_ssrgemm_tn_t, 32x128x8_16x32x1_4x4_4x8_2x4) using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename 
cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1262,9 +1262,9 @@ TEST(SM50_device_maximum_multiplies_ssrgemm_tn_t, 32x256x8_16x64x1_4x8_4x8_2x4) using WarpShape = cutlass::gemm::GemmShape<16, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1298,9 +1298,9 @@ TEST(SM50_device_maximum_multiplies_ssrgemm_tn_t, 64x64x8_32x16x1_4x4_8x4_2x4) { using WarpShape = cutlass::gemm::GemmShape<32, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1334,9 +1334,9 @@ TEST(SM50_device_maximum_multiplies_ssrgemm_tn_t, 64x128x8_32x32x1_8x4_4x8_2x4) using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename 
cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1370,9 +1370,9 @@ TEST(SM50_device_maximum_multiplies_ssrgemm_tn_t, 64x256x8_32x64x1_8x8_4x8_2x4) using WarpShape = cutlass::gemm::GemmShape<32, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1406,9 +1406,9 @@ TEST(SM50_device_maximum_multiplies_ssrgemm_tn_t, 128x128x8_64x32x1_8x8_8x4_2x4) using WarpShape = cutlass::gemm::GemmShape<64, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1442,9 +1442,9 @@ TEST(SM50_device_maximum_multiplies_ssrgemm_tn_t, 32x32x8_8x16x1_2x2_4x8_4x2) { using WarpShape = cutlass::gemm::GemmShape<8, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename 
cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1478,9 +1478,9 @@ TEST(SM50_device_maximum_multiplies_ssrgemm_tn_t, 64x32x8_16x16x1_4x2_4x8_4x2) { using WarpShape = cutlass::gemm::GemmShape<16, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1514,9 +1514,9 @@ TEST(SM50_device_maximum_multiplies_ssrgemm_tn_t, 64x64x8_16x32x1_4x4_4x8_4x2) { using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1550,9 +1550,9 @@ TEST(SM50_device_maximum_multiplies_ssrgemm_tn_t, 128x32x8_32x16x1_4x4_8x4_4x2) using WarpShape = cutlass::gemm::GemmShape<32, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename 
cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1586,9 +1586,9 @@ TEST(SM50_device_maximum_multiplies_ssrgemm_tn_t, 128x64x8_32x32x1_8x4_4x8_4x2) using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1622,9 +1622,9 @@ TEST(SM50_device_maximum_multiplies_ssrgemm_tn_t, 128x128x8_32x64x1_8x8_4x8_4x2) using WarpShape = cutlass::gemm::GemmShape<32, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1658,9 +1658,9 @@ TEST(SM50_device_maximum_multiplies_ssrgemm_tn_t, 256x32x8_64x16x1_8x4_8x4_4x2) using WarpShape = cutlass::gemm::GemmShape<64, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename 
cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1694,9 +1694,9 @@ TEST(SM50_device_maximum_multiplies_ssrgemm_tn_t, 256x64x8_64x32x1_8x8_8x4_4x2) using WarpShape = cutlass::gemm::GemmShape<64, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1730,9 +1730,9 @@ TEST(SM50_device_maximum_multiplies_ssrgemm_tn_t, 32x64x16_8x16x1_2x2_4x8_4x4) { using WarpShape = cutlass::gemm::GemmShape<8, 16, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1766,9 +1766,9 @@ TEST(SM50_device_maximum_multiplies_ssrgemm_tn_t, 32x128x16_8x32x1_2x4_4x8_4x4) using WarpShape = cutlass::gemm::GemmShape<8, 32, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename 
cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1802,9 +1802,9 @@ TEST(SM50_device_maximum_multiplies_ssrgemm_tn_t, 64x32x16_16x8x1_2x2_8x4_4x4) { using WarpShape = cutlass::gemm::GemmShape<16, 8, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1838,9 +1838,9 @@ TEST(SM50_device_maximum_multiplies_ssrgemm_tn_t, 64x64x8_16x16x1_4x2_4x8_4x4) { using WarpShape = cutlass::gemm::GemmShape<16, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1874,9 +1874,9 @@ TEST(SM50_device_maximum_multiplies_ssrgemm_tn_t, 64x128x8_16x32x1_4x4_4x8_4x4) using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename 
cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1910,9 +1910,9 @@ TEST(SM50_device_maximum_multiplies_ssrgemm_tn_t, 64x256x8_16x64x1_4x8_4x8_4x4) using WarpShape = cutlass::gemm::GemmShape<16, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1946,9 +1946,9 @@ TEST(SM50_device_maximum_multiplies_ssrgemm_tn_t, 128x32x16_32x8x1_4x2_8x4_4x4) using WarpShape = cutlass::gemm::GemmShape<32, 8, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1982,9 +1982,9 @@ TEST(SM50_device_maximum_multiplies_ssrgemm_tn_t, 128x64x8_32x16x1_4x4_8x4_4x4) using WarpShape = cutlass::gemm::GemmShape<32, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename 
cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -2018,9 +2018,9 @@ TEST(SM50_device_maximum_multiplies_ssrgemm_tn_t, 128x128x8_32x32x1_8x4_4x8_4x4) using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -2054,9 +2054,9 @@ TEST(SM50_device_maximum_multiplies_ssrgemm_tn_t, 256x64x8_64x16x1_8x4_8x4_4x4) using WarpShape = cutlass::gemm::GemmShape<64, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; diff --git a/test/device/sm50_simt_maximum_multiplies_ssrgemm_tt_n.cu b/test/device/sm50_simt_maximum_multiplies_ssrgemm_tt_n.cu index 25220fa..5ad67fc 100644 --- a/test/device/sm50_simt_maximum_multiplies_ssrgemm_tt_n.cu +++ 
b/test/device/sm50_simt_maximum_multiplies_ssrgemm_tt_n.cu @@ -38,9 +38,9 @@ TEST(SM50_device_maximum_multiplies_ssrgemm_tt_n, 8x32x8_8x32x1_2x4_4x8_1x1) { using WarpShape = cutlass::gemm::GemmShape<8, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -74,9 +74,9 @@ TEST(SM50_device_maximum_multiplies_ssrgemm_tt_n, 16x32x8_16x32x1_4x4_4x8_1x1) { using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -110,9 +110,9 @@ TEST(SM50_device_maximum_multiplies_ssrgemm_tt_n, 16x64x8_16x64x1_4x8_4x8_1x1) { using WarpShape = cutlass::gemm::GemmShape<16, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = 
Config::MultiplicationOp; @@ -146,9 +146,9 @@ TEST(SM50_device_maximum_multiplies_ssrgemm_tt_n, 32x32x8_32x32x1_8x4_4x8_1x1) { using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -182,9 +182,9 @@ TEST(SM50_device_maximum_multiplies_ssrgemm_tt_n, 32x64x8_32x64x1_8x8_4x8_1x1) { using WarpShape = cutlass::gemm::GemmShape<32, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -218,9 +218,9 @@ TEST(SM50_device_maximum_multiplies_ssrgemm_tt_n, 64x32x8_64x32x1_8x8_8x4_1x1) { using WarpShape = cutlass::gemm::GemmShape<64, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -254,9 
+254,9 @@ TEST(SM50_device_maximum_multiplies_ssrgemm_tt_n, 8x32x8_8x16x1_2x2_4x8_1x2) { using WarpShape = cutlass::gemm::GemmShape<8, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -290,9 +290,9 @@ TEST(SM50_device_maximum_multiplies_ssrgemm_tt_n, 8x64x8_8x32x1_2x4_4x8_1x2) { using WarpShape = cutlass::gemm::GemmShape<8, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -326,9 +326,9 @@ TEST(SM50_device_maximum_multiplies_ssrgemm_tt_n, 16x32x8_16x16x1_4x2_4x8_1x2) { using WarpShape = cutlass::gemm::GemmShape<16, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -362,9 +362,9 @@ 
TEST(SM50_device_maximum_multiplies_ssrgemm_tt_n, 16x64x8_16x32x1_4x4_4x8_1x2) { using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -398,9 +398,9 @@ TEST(SM50_device_maximum_multiplies_ssrgemm_tt_n, 16x128x8_16x64x1_4x8_4x8_1x2) using WarpShape = cutlass::gemm::GemmShape<16, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -434,9 +434,9 @@ TEST(SM50_device_maximum_multiplies_ssrgemm_tt_n, 32x32x8_32x16x1_4x4_8x4_1x2) { using WarpShape = cutlass::gemm::GemmShape<32, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -470,9 +470,9 @@ 
TEST(SM50_device_maximum_multiplies_ssrgemm_tt_n, 32x64x8_32x32x1_8x4_4x8_1x2) { using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -506,9 +506,9 @@ TEST(SM50_device_maximum_multiplies_ssrgemm_tt_n, 32x128x8_32x64x1_8x8_4x8_1x2) using WarpShape = cutlass::gemm::GemmShape<32, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -542,9 +542,9 @@ TEST(SM50_device_maximum_multiplies_ssrgemm_tt_n, 64x64x8_64x32x1_8x8_8x4_1x2) { using WarpShape = cutlass::gemm::GemmShape<64, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -578,9 +578,9 @@ 
TEST(SM50_device_maximum_multiplies_ssrgemm_tt_n, 32x32x8_16x32x1_4x4_4x8_2x1) { using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -614,9 +614,9 @@ TEST(SM50_device_maximum_multiplies_ssrgemm_tt_n, 64x32x8_32x32x1_8x4_4x8_2x1) { using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -650,9 +650,9 @@ TEST(SM50_device_maximum_multiplies_ssrgemm_tt_n, 64x64x8_32x64x1_8x8_4x8_2x1) { using WarpShape = cutlass::gemm::GemmShape<32, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -686,9 +686,9 @@ 
TEST(SM50_device_maximum_multiplies_ssrgemm_tt_n, 128x32x8_64x32x1_8x8_8x4_2x1) using WarpShape = cutlass::gemm::GemmShape<64, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -722,9 +722,9 @@ TEST(SM50_device_maximum_multiplies_ssrgemm_tt_n, 16x32x8_8x16x1_2x2_4x8_2x2) { using WarpShape = cutlass::gemm::GemmShape<8, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -758,9 +758,9 @@ TEST(SM50_device_maximum_multiplies_ssrgemm_tt_n, 16x64x8_8x32x1_2x4_4x8_2x2) { using WarpShape = cutlass::gemm::GemmShape<8, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -794,9 +794,9 @@ 
TEST(SM50_device_maximum_multiplies_ssrgemm_tt_n, 32x32x8_16x16x1_4x2_4x8_2x2) { using WarpShape = cutlass::gemm::GemmShape<16, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -830,9 +830,9 @@ TEST(SM50_device_maximum_multiplies_ssrgemm_tt_n, 32x64x8_16x32x1_4x4_4x8_2x2) { using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -866,9 +866,9 @@ TEST(SM50_device_maximum_multiplies_ssrgemm_tt_n, 32x128x8_16x64x1_4x8_4x8_2x2) using WarpShape = cutlass::gemm::GemmShape<16, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -902,9 +902,9 @@ 
TEST(SM50_device_maximum_multiplies_ssrgemm_tt_n, 64x32x8_32x16x1_4x4_8x4_2x2) { using WarpShape = cutlass::gemm::GemmShape<32, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -938,9 +938,9 @@ TEST(SM50_device_maximum_multiplies_ssrgemm_tt_n, 64x64x8_32x32x1_8x4_4x8_2x2) { using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -974,9 +974,9 @@ TEST(SM50_device_maximum_multiplies_ssrgemm_tt_n, 64x128x8_32x64x1_8x8_4x8_2x2) using WarpShape = cutlass::gemm::GemmShape<32, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1010,9 +1010,9 @@ 
TEST(SM50_device_maximum_multiplies_ssrgemm_tt_n, 128x32x8_64x16x1_8x4_8x4_2x2) using WarpShape = cutlass::gemm::GemmShape<64, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1046,9 +1046,9 @@ TEST(SM50_device_maximum_multiplies_ssrgemm_tt_n, 128x64x8_64x32x1_8x8_8x4_2x2) using WarpShape = cutlass::gemm::GemmShape<64, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1082,9 +1082,9 @@ TEST(SM50_device_maximum_multiplies_ssrgemm_tt_n, 16x64x16_8x16x1_2x2_4x8_2x4) { using WarpShape = cutlass::gemm::GemmShape<8, 16, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1118,9 +1118,9 @@ 
TEST(SM50_device_maximum_multiplies_ssrgemm_tt_n, 16x128x16_8x32x1_2x4_4x8_2x4) using WarpShape = cutlass::gemm::GemmShape<8, 32, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1154,9 +1154,9 @@ TEST(SM50_device_maximum_multiplies_ssrgemm_tt_n, 32x32x8_16x8x1_2x2_8x4_2x4) { using WarpShape = cutlass::gemm::GemmShape<16, 8, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1190,9 +1190,9 @@ TEST(SM50_device_maximum_multiplies_ssrgemm_tt_n, 32x64x8_16x16x1_4x2_4x8_2x4) { using WarpShape = cutlass::gemm::GemmShape<16, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1226,9 +1226,9 @@ 
TEST(SM50_device_maximum_multiplies_ssrgemm_tt_n, 32x128x8_16x32x1_4x4_4x8_2x4) using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1262,9 +1262,9 @@ TEST(SM50_device_maximum_multiplies_ssrgemm_tt_n, 32x256x8_16x64x1_4x8_4x8_2x4) using WarpShape = cutlass::gemm::GemmShape<16, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1298,9 +1298,9 @@ TEST(SM50_device_maximum_multiplies_ssrgemm_tt_n, 64x64x8_32x16x1_4x4_8x4_2x4) { using WarpShape = cutlass::gemm::GemmShape<32, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1334,9 +1334,9 @@ 
TEST(SM50_device_maximum_multiplies_ssrgemm_tt_n, 64x128x8_32x32x1_8x4_4x8_2x4) using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1370,9 +1370,9 @@ TEST(SM50_device_maximum_multiplies_ssrgemm_tt_n, 64x256x8_32x64x1_8x8_4x8_2x4) using WarpShape = cutlass::gemm::GemmShape<32, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1406,9 +1406,9 @@ TEST(SM50_device_maximum_multiplies_ssrgemm_tt_n, 128x128x8_64x32x1_8x8_8x4_2x4) using WarpShape = cutlass::gemm::GemmShape<64, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1442,9 +1442,9 @@ 
TEST(SM50_device_maximum_multiplies_ssrgemm_tt_n, 32x32x8_8x16x1_2x2_4x8_4x2) { using WarpShape = cutlass::gemm::GemmShape<8, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1478,9 +1478,9 @@ TEST(SM50_device_maximum_multiplies_ssrgemm_tt_n, 64x32x8_16x16x1_4x2_4x8_4x2) { using WarpShape = cutlass::gemm::GemmShape<16, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1514,9 +1514,9 @@ TEST(SM50_device_maximum_multiplies_ssrgemm_tt_n, 64x64x8_16x32x1_4x4_4x8_4x2) { using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1550,9 +1550,9 @@ 
TEST(SM50_device_maximum_multiplies_ssrgemm_tt_n, 128x32x8_32x16x1_4x4_8x4_4x2) using WarpShape = cutlass::gemm::GemmShape<32, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1586,9 +1586,9 @@ TEST(SM50_device_maximum_multiplies_ssrgemm_tt_n, 128x64x8_32x32x1_8x4_4x8_4x2) using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1622,9 +1622,9 @@ TEST(SM50_device_maximum_multiplies_ssrgemm_tt_n, 128x128x8_32x64x1_8x8_4x8_4x2) using WarpShape = cutlass::gemm::GemmShape<32, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1658,9 +1658,9 @@ 
TEST(SM50_device_maximum_multiplies_ssrgemm_tt_n, 256x32x8_64x16x1_8x4_8x4_4x2) using WarpShape = cutlass::gemm::GemmShape<64, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1694,9 +1694,9 @@ TEST(SM50_device_maximum_multiplies_ssrgemm_tt_n, 256x64x8_64x32x1_8x8_8x4_4x2) using WarpShape = cutlass::gemm::GemmShape<64, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1730,9 +1730,9 @@ TEST(SM50_device_maximum_multiplies_ssrgemm_tt_n, 32x64x16_8x16x1_2x2_4x8_4x4) { using WarpShape = cutlass::gemm::GemmShape<8, 16, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1766,9 +1766,9 @@ 
TEST(SM50_device_maximum_multiplies_ssrgemm_tt_n, 32x128x16_8x32x1_2x4_4x8_4x4) using WarpShape = cutlass::gemm::GemmShape<8, 32, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1802,9 +1802,9 @@ TEST(SM50_device_maximum_multiplies_ssrgemm_tt_n, 64x32x16_16x8x1_2x2_8x4_4x4) { using WarpShape = cutlass::gemm::GemmShape<16, 8, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1838,9 +1838,9 @@ TEST(SM50_device_maximum_multiplies_ssrgemm_tt_n, 64x64x8_16x16x1_4x2_4x8_4x4) { using WarpShape = cutlass::gemm::GemmShape<16, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1874,9 +1874,9 @@ 
TEST(SM50_device_maximum_multiplies_ssrgemm_tt_n, 64x128x8_16x32x1_4x4_4x8_4x4) using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1910,9 +1910,9 @@ TEST(SM50_device_maximum_multiplies_ssrgemm_tt_n, 64x256x8_16x64x1_4x8_4x8_4x4) using WarpShape = cutlass::gemm::GemmShape<16, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1946,9 +1946,9 @@ TEST(SM50_device_maximum_multiplies_ssrgemm_tt_n, 128x32x16_32x8x1_4x2_8x4_4x4) using WarpShape = cutlass::gemm::GemmShape<32, 8, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1982,9 +1982,9 @@ 
TEST(SM50_device_maximum_multiplies_ssrgemm_tt_n, 128x64x8_32x16x1_4x4_8x4_4x4) using WarpShape = cutlass::gemm::GemmShape<32, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -2018,9 +2018,9 @@ TEST(SM50_device_maximum_multiplies_ssrgemm_tt_n, 128x128x8_32x32x1_8x4_4x8_4x4) using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -2054,9 +2054,9 @@ TEST(SM50_device_maximum_multiplies_ssrgemm_tt_n, 256x64x8_64x16x1_8x4_8x4_4x4) using WarpShape = cutlass::gemm::GemmShape<64, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; diff --git 
a/test/device/sm50_simt_maximum_multiplies_ssrgemm_tt_t.cu b/test/device/sm50_simt_maximum_multiplies_ssrgemm_tt_t.cu index ed894ad..bf7fbb4 100644 --- a/test/device/sm50_simt_maximum_multiplies_ssrgemm_tt_t.cu +++ b/test/device/sm50_simt_maximum_multiplies_ssrgemm_tt_t.cu @@ -38,9 +38,9 @@ TEST(SM50_device_maximum_multiplies_ssrgemm_tt_t, 8x32x8_8x32x1_2x4_4x8_1x1) { using WarpShape = cutlass::gemm::GemmShape<8, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -74,9 +74,9 @@ TEST(SM50_device_maximum_multiplies_ssrgemm_tt_t, 16x32x8_16x32x1_4x4_4x8_1x1) { using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -110,9 +110,9 @@ TEST(SM50_device_maximum_multiplies_ssrgemm_tt_t, 16x64x8_16x64x1_4x8_4x8_1x1) { using WarpShape = cutlass::gemm::GemmShape<16, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename 
cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -146,9 +146,9 @@ TEST(SM50_device_maximum_multiplies_ssrgemm_tt_t, 32x32x8_32x32x1_8x4_4x8_1x1) { using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -182,9 +182,9 @@ TEST(SM50_device_maximum_multiplies_ssrgemm_tt_t, 32x64x8_32x64x1_8x8_4x8_1x1) { using WarpShape = cutlass::gemm::GemmShape<32, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -218,9 +218,9 @@ TEST(SM50_device_maximum_multiplies_ssrgemm_tt_t, 64x32x8_64x32x1_8x8_8x4_1x1) { using WarpShape = cutlass::gemm::GemmShape<64, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename 
cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -254,9 +254,9 @@ TEST(SM50_device_maximum_multiplies_ssrgemm_tt_t, 8x32x8_8x16x1_2x2_4x8_1x2) { using WarpShape = cutlass::gemm::GemmShape<8, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -290,9 +290,9 @@ TEST(SM50_device_maximum_multiplies_ssrgemm_tt_t, 8x64x8_8x32x1_2x4_4x8_1x2) { using WarpShape = cutlass::gemm::GemmShape<8, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -326,9 +326,9 @@ TEST(SM50_device_maximum_multiplies_ssrgemm_tt_t, 16x32x8_16x16x1_4x2_4x8_1x2) { using WarpShape = cutlass::gemm::GemmShape<16, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename 
cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -362,9 +362,9 @@ TEST(SM50_device_maximum_multiplies_ssrgemm_tt_t, 16x64x8_16x32x1_4x4_4x8_1x2) { using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -398,9 +398,9 @@ TEST(SM50_device_maximum_multiplies_ssrgemm_tt_t, 16x128x8_16x64x1_4x8_4x8_1x2) using WarpShape = cutlass::gemm::GemmShape<16, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -434,9 +434,9 @@ TEST(SM50_device_maximum_multiplies_ssrgemm_tt_t, 32x32x8_32x16x1_4x4_8x4_1x2) { using WarpShape = cutlass::gemm::GemmShape<32, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename 
cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -470,9 +470,9 @@ TEST(SM50_device_maximum_multiplies_ssrgemm_tt_t, 32x64x8_32x32x1_8x4_4x8_1x2) { using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -506,9 +506,9 @@ TEST(SM50_device_maximum_multiplies_ssrgemm_tt_t, 32x128x8_32x64x1_8x8_4x8_1x2) using WarpShape = cutlass::gemm::GemmShape<32, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -542,9 +542,9 @@ TEST(SM50_device_maximum_multiplies_ssrgemm_tt_t, 64x64x8_64x32x1_8x8_8x4_1x2) { using WarpShape = cutlass::gemm::GemmShape<64, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename 
cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -578,9 +578,9 @@ TEST(SM50_device_maximum_multiplies_ssrgemm_tt_t, 32x32x8_16x32x1_4x4_4x8_2x1) { using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -614,9 +614,9 @@ TEST(SM50_device_maximum_multiplies_ssrgemm_tt_t, 64x32x8_32x32x1_8x4_4x8_2x1) { using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -650,9 +650,9 @@ TEST(SM50_device_maximum_multiplies_ssrgemm_tt_t, 64x64x8_32x64x1_8x8_4x8_2x1) { using WarpShape = cutlass::gemm::GemmShape<32, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename 
cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -686,9 +686,9 @@ TEST(SM50_device_maximum_multiplies_ssrgemm_tt_t, 128x32x8_64x32x1_8x8_8x4_2x1) using WarpShape = cutlass::gemm::GemmShape<64, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -722,9 +722,9 @@ TEST(SM50_device_maximum_multiplies_ssrgemm_tt_t, 16x32x8_8x16x1_2x2_4x8_2x2) { using WarpShape = cutlass::gemm::GemmShape<8, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -758,9 +758,9 @@ TEST(SM50_device_maximum_multiplies_ssrgemm_tt_t, 16x64x8_8x32x1_2x4_4x8_2x2) { using WarpShape = cutlass::gemm::GemmShape<8, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename 
cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -794,9 +794,9 @@ TEST(SM50_device_maximum_multiplies_ssrgemm_tt_t, 32x32x8_16x16x1_4x2_4x8_2x2) { using WarpShape = cutlass::gemm::GemmShape<16, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -830,9 +830,9 @@ TEST(SM50_device_maximum_multiplies_ssrgemm_tt_t, 32x64x8_16x32x1_4x4_4x8_2x2) { using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -866,9 +866,9 @@ TEST(SM50_device_maximum_multiplies_ssrgemm_tt_t, 32x128x8_16x64x1_4x8_4x8_2x2) using WarpShape = cutlass::gemm::GemmShape<16, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename 
cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -902,9 +902,9 @@ TEST(SM50_device_maximum_multiplies_ssrgemm_tt_t, 64x32x8_32x16x1_4x4_8x4_2x2) { using WarpShape = cutlass::gemm::GemmShape<32, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -938,9 +938,9 @@ TEST(SM50_device_maximum_multiplies_ssrgemm_tt_t, 64x64x8_32x32x1_8x4_4x8_2x2) { using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -974,9 +974,9 @@ TEST(SM50_device_maximum_multiplies_ssrgemm_tt_t, 64x128x8_32x64x1_8x8_4x8_2x2) using WarpShape = cutlass::gemm::GemmShape<32, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename 
cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1010,9 +1010,9 @@ TEST(SM50_device_maximum_multiplies_ssrgemm_tt_t, 128x32x8_64x16x1_8x4_8x4_2x2) using WarpShape = cutlass::gemm::GemmShape<64, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1046,9 +1046,9 @@ TEST(SM50_device_maximum_multiplies_ssrgemm_tt_t, 128x64x8_64x32x1_8x8_8x4_2x2) using WarpShape = cutlass::gemm::GemmShape<64, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1082,9 +1082,9 @@ TEST(SM50_device_maximum_multiplies_ssrgemm_tt_t, 16x64x16_8x16x1_2x2_4x8_2x4) { using WarpShape = cutlass::gemm::GemmShape<8, 16, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename 
cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1118,9 +1118,9 @@ TEST(SM50_device_maximum_multiplies_ssrgemm_tt_t, 16x128x16_8x32x1_2x4_4x8_2x4) using WarpShape = cutlass::gemm::GemmShape<8, 32, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1154,9 +1154,9 @@ TEST(SM50_device_maximum_multiplies_ssrgemm_tt_t, 32x32x8_16x8x1_2x2_8x4_2x4) { using WarpShape = cutlass::gemm::GemmShape<16, 8, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1190,9 +1190,9 @@ TEST(SM50_device_maximum_multiplies_ssrgemm_tt_t, 32x64x8_16x16x1_4x2_4x8_2x4) { using WarpShape = cutlass::gemm::GemmShape<16, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename 
cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1226,9 +1226,9 @@ TEST(SM50_device_maximum_multiplies_ssrgemm_tt_t, 32x128x8_16x32x1_4x4_4x8_2x4) using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1262,9 +1262,9 @@ TEST(SM50_device_maximum_multiplies_ssrgemm_tt_t, 32x256x8_16x64x1_4x8_4x8_2x4) using WarpShape = cutlass::gemm::GemmShape<16, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1298,9 +1298,9 @@ TEST(SM50_device_maximum_multiplies_ssrgemm_tt_t, 64x64x8_32x16x1_4x4_8x4_2x4) { using WarpShape = cutlass::gemm::GemmShape<32, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename 
cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1334,9 +1334,9 @@ TEST(SM50_device_maximum_multiplies_ssrgemm_tt_t, 64x128x8_32x32x1_8x4_4x8_2x4) using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1370,9 +1370,9 @@ TEST(SM50_device_maximum_multiplies_ssrgemm_tt_t, 64x256x8_32x64x1_8x8_4x8_2x4) using WarpShape = cutlass::gemm::GemmShape<32, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1406,9 +1406,9 @@ TEST(SM50_device_maximum_multiplies_ssrgemm_tt_t, 128x128x8_64x32x1_8x8_8x4_2x4) using WarpShape = cutlass::gemm::GemmShape<64, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename 
cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1442,9 +1442,9 @@ TEST(SM50_device_maximum_multiplies_ssrgemm_tt_t, 32x32x8_8x16x1_2x2_4x8_4x2) { using WarpShape = cutlass::gemm::GemmShape<8, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1478,9 +1478,9 @@ TEST(SM50_device_maximum_multiplies_ssrgemm_tt_t, 64x32x8_16x16x1_4x2_4x8_4x2) { using WarpShape = cutlass::gemm::GemmShape<16, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1514,9 +1514,9 @@ TEST(SM50_device_maximum_multiplies_ssrgemm_tt_t, 64x64x8_16x32x1_4x4_4x8_4x2) { using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename 
cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1550,9 +1550,9 @@ TEST(SM50_device_maximum_multiplies_ssrgemm_tt_t, 128x32x8_32x16x1_4x4_8x4_4x2) using WarpShape = cutlass::gemm::GemmShape<32, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1586,9 +1586,9 @@ TEST(SM50_device_maximum_multiplies_ssrgemm_tt_t, 128x64x8_32x32x1_8x4_4x8_4x2) using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1622,9 +1622,9 @@ TEST(SM50_device_maximum_multiplies_ssrgemm_tt_t, 128x128x8_32x64x1_8x8_4x8_4x2) using WarpShape = cutlass::gemm::GemmShape<32, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename 
cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1658,9 +1658,9 @@ TEST(SM50_device_maximum_multiplies_ssrgemm_tt_t, 256x32x8_64x16x1_8x4_8x4_4x2) using WarpShape = cutlass::gemm::GemmShape<64, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1694,9 +1694,9 @@ TEST(SM50_device_maximum_multiplies_ssrgemm_tt_t, 256x64x8_64x32x1_8x8_8x4_4x2) using WarpShape = cutlass::gemm::GemmShape<64, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1730,9 +1730,9 @@ TEST(SM50_device_maximum_multiplies_ssrgemm_tt_t, 32x64x16_8x16x1_2x2_4x8_4x4) { using WarpShape = cutlass::gemm::GemmShape<8, 16, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename 
cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1766,9 +1766,9 @@ TEST(SM50_device_maximum_multiplies_ssrgemm_tt_t, 32x128x16_8x32x1_2x4_4x8_4x4) using WarpShape = cutlass::gemm::GemmShape<8, 32, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1802,9 +1802,9 @@ TEST(SM50_device_maximum_multiplies_ssrgemm_tt_t, 64x32x16_16x8x1_2x2_8x4_4x4) { using WarpShape = cutlass::gemm::GemmShape<16, 8, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1838,9 +1838,9 @@ TEST(SM50_device_maximum_multiplies_ssrgemm_tt_t, 64x64x8_16x16x1_4x2_4x8_4x4) { using WarpShape = cutlass::gemm::GemmShape<16, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename 
cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1874,9 +1874,9 @@ TEST(SM50_device_maximum_multiplies_ssrgemm_tt_t, 64x128x8_16x32x1_4x4_4x8_4x4) using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1910,9 +1910,9 @@ TEST(SM50_device_maximum_multiplies_ssrgemm_tt_t, 64x256x8_16x64x1_4x8_4x8_4x4) using WarpShape = cutlass::gemm::GemmShape<16, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1946,9 +1946,9 @@ TEST(SM50_device_maximum_multiplies_ssrgemm_tt_t, 128x32x16_32x8x1_4x2_8x4_4x4) using WarpShape = cutlass::gemm::GemmShape<32, 8, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename 
cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1982,9 +1982,9 @@ TEST(SM50_device_maximum_multiplies_ssrgemm_tt_t, 128x64x8_32x16x1_4x4_8x4_4x4) using WarpShape = cutlass::gemm::GemmShape<32, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -2018,9 +2018,9 @@ TEST(SM50_device_maximum_multiplies_ssrgemm_tt_t, 128x128x8_32x32x1_8x4_4x8_4x4) using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -2054,9 +2054,9 @@ TEST(SM50_device_maximum_multiplies_ssrgemm_tt_t, 256x64x8_64x16x1_8x4_8x4_4x4) using WarpShape = cutlass::gemm::GemmShape<64, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::multiplies, SmArch>; + using Config = typename 
cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; diff --git a/test/device/sm50_simt_maximum_plus_dsrgemm_nn_n.cu b/test/device/sm50_simt_maximum_plus_dsrgemm_nn_n.cu index 4a1c313..d84235d 100644 --- a/test/device/sm50_simt_maximum_plus_dsrgemm_nn_n.cu +++ b/test/device/sm50_simt_maximum_plus_dsrgemm_nn_n.cu @@ -38,9 +38,9 @@ TEST(SM50_device_maximum_plus_dsrgemm_nn_n, 8x32x8_8x32x1_2x4_4x8_1x1) { using WarpShape = cutlass::gemm::GemmShape<8, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -74,9 +74,9 @@ TEST(SM50_device_maximum_plus_dsrgemm_nn_n, 16x32x8_16x32x1_4x4_4x8_1x1) { using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -110,9 +110,9 @@ TEST(SM50_device_maximum_plus_dsrgemm_nn_n, 16x64x8_16x64x1_4x8_4x8_1x1) { using WarpShape = cutlass::gemm::GemmShape<16, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename 
cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -146,9 +146,9 @@ TEST(SM50_device_maximum_plus_dsrgemm_nn_n, 32x32x8_32x32x1_8x4_4x8_1x1) { using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -182,9 +182,9 @@ TEST(SM50_device_maximum_plus_dsrgemm_nn_n, 8x32x8_8x16x1_2x2_4x8_1x2) { using WarpShape = cutlass::gemm::GemmShape<8, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -218,9 +218,9 @@ TEST(SM50_device_maximum_plus_dsrgemm_nn_n, 8x64x8_8x32x1_2x4_4x8_1x2) { using WarpShape = cutlass::gemm::GemmShape<8, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, 
OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -254,9 +254,9 @@ TEST(SM50_device_maximum_plus_dsrgemm_nn_n, 16x32x8_16x16x1_4x2_4x8_1x2) { using WarpShape = cutlass::gemm::GemmShape<16, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -290,9 +290,9 @@ TEST(SM50_device_maximum_plus_dsrgemm_nn_n, 16x64x8_16x32x1_4x4_4x8_1x2) { using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -326,9 +326,9 @@ TEST(SM50_device_maximum_plus_dsrgemm_nn_n, 16x128x8_16x64x1_4x8_4x8_1x2) { using WarpShape = cutlass::gemm::GemmShape<16, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename 
cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -362,9 +362,9 @@ TEST(SM50_device_maximum_plus_dsrgemm_nn_n, 32x32x8_32x16x1_4x4_8x4_1x2) { using WarpShape = cutlass::gemm::GemmShape<32, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -398,9 +398,9 @@ TEST(SM50_device_maximum_plus_dsrgemm_nn_n, 32x64x8_32x32x1_8x4_4x8_1x2) { using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -434,9 +434,9 @@ TEST(SM50_device_maximum_plus_dsrgemm_nn_n, 32x32x8_16x32x1_4x4_4x8_2x1) { using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, 
precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -470,9 +470,9 @@ TEST(SM50_device_maximum_plus_dsrgemm_nn_n, 64x32x8_32x32x1_8x4_4x8_2x1) { using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -506,9 +506,9 @@ TEST(SM50_device_maximum_plus_dsrgemm_nn_n, 16x32x8_8x16x1_2x2_4x8_2x2) { using WarpShape = cutlass::gemm::GemmShape<8, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -542,9 +542,9 @@ TEST(SM50_device_maximum_plus_dsrgemm_nn_n, 16x64x8_8x32x1_2x4_4x8_2x2) { using WarpShape = cutlass::gemm::GemmShape<8, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; 
using MultOp = Config::MultiplicationOp; @@ -578,9 +578,9 @@ TEST(SM50_device_maximum_plus_dsrgemm_nn_n, 32x32x8_16x16x1_4x2_4x8_2x2) { using WarpShape = cutlass::gemm::GemmShape<16, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -614,9 +614,9 @@ TEST(SM50_device_maximum_plus_dsrgemm_nn_n, 32x64x8_16x32x1_4x4_4x8_2x2) { using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -650,9 +650,9 @@ TEST(SM50_device_maximum_plus_dsrgemm_nn_n, 32x128x8_16x64x1_4x8_4x8_2x2) { using WarpShape = cutlass::gemm::GemmShape<16, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -686,9 +686,9 @@ 
TEST(SM50_device_maximum_plus_dsrgemm_nn_n, 64x32x8_32x16x1_4x4_8x4_2x2) { using WarpShape = cutlass::gemm::GemmShape<32, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -722,9 +722,9 @@ TEST(SM50_device_maximum_plus_dsrgemm_nn_n, 64x64x8_32x32x1_8x4_4x8_2x2) { using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -758,9 +758,9 @@ TEST(SM50_device_maximum_plus_dsrgemm_nn_n, 128x32x8_64x16x1_8x4_8x4_2x2) { using WarpShape = cutlass::gemm::GemmShape<64, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -794,9 +794,9 @@ TEST(SM50_device_maximum_plus_dsrgemm_nn_n, 16x64x16_8x16x1_2x2_4x8_2x4) { using WarpShape = 
cutlass::gemm::GemmShape<8, 16, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -830,9 +830,9 @@ TEST(SM50_device_maximum_plus_dsrgemm_nn_n, 16x128x16_8x32x1_2x4_4x8_2x4) { using WarpShape = cutlass::gemm::GemmShape<8, 32, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -866,9 +866,9 @@ TEST(SM50_device_maximum_plus_dsrgemm_nn_n, 32x32x8_16x8x1_2x2_8x4_2x4) { using WarpShape = cutlass::gemm::GemmShape<16, 8, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -902,9 +902,9 @@ TEST(SM50_device_maximum_plus_dsrgemm_nn_n, 32x64x8_16x16x1_4x2_4x8_2x4) { using WarpShape = cutlass::gemm::GemmShape<16, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 
1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -938,9 +938,9 @@ TEST(SM50_device_maximum_plus_dsrgemm_nn_n, 32x128x8_16x32x1_4x4_4x8_2x4) { using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -974,9 +974,9 @@ TEST(SM50_device_maximum_plus_dsrgemm_nn_n, 64x64x8_32x16x1_4x4_8x4_2x4) { using WarpShape = cutlass::gemm::GemmShape<32, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1010,9 +1010,9 @@ TEST(SM50_device_maximum_plus_dsrgemm_nn_n, 32x32x8_8x16x1_2x2_4x8_4x2) { using WarpShape = cutlass::gemm::GemmShape<8, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - 
precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1046,9 +1046,9 @@ TEST(SM50_device_maximum_plus_dsrgemm_nn_n, 64x32x8_16x16x1_4x2_4x8_4x2) { using WarpShape = cutlass::gemm::GemmShape<16, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1082,9 +1082,9 @@ TEST(SM50_device_maximum_plus_dsrgemm_nn_n, 64x64x8_16x32x1_4x4_4x8_4x2) { using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1118,9 +1118,9 @@ TEST(SM50_device_maximum_plus_dsrgemm_nn_n, 128x32x8_32x16x1_4x4_8x4_4x2) { using WarpShape = cutlass::gemm::GemmShape<32, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, 
SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1154,9 +1154,9 @@ TEST(SM50_device_maximum_plus_dsrgemm_nn_n, 32x64x16_8x16x1_2x2_4x8_4x4) { using WarpShape = cutlass::gemm::GemmShape<8, 16, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1190,9 +1190,9 @@ TEST(SM50_device_maximum_plus_dsrgemm_nn_n, 32x128x16_8x32x1_2x4_4x8_4x4) { using WarpShape = cutlass::gemm::GemmShape<8, 32, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1226,9 +1226,9 @@ TEST(SM50_device_maximum_plus_dsrgemm_nn_n, 64x32x16_16x8x1_2x2_8x4_4x4) { using WarpShape = cutlass::gemm::GemmShape<16, 8, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + 
precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1262,9 +1262,9 @@ TEST(SM50_device_maximum_plus_dsrgemm_nn_n, 64x64x8_16x16x1_4x2_4x8_4x4) { using WarpShape = cutlass::gemm::GemmShape<16, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1298,9 +1298,9 @@ TEST(SM50_device_maximum_plus_dsrgemm_nn_n, 128x32x16_32x8x1_4x2_8x4_4x4) { using WarpShape = cutlass::gemm::GemmShape<32, 8, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; diff --git a/test/device/sm50_simt_maximum_plus_dsrgemm_nn_t.cu b/test/device/sm50_simt_maximum_plus_dsrgemm_nn_t.cu index 2aa813e..507b38b 100644 --- a/test/device/sm50_simt_maximum_plus_dsrgemm_nn_t.cu +++ b/test/device/sm50_simt_maximum_plus_dsrgemm_nn_t.cu @@ -38,9 +38,9 @@ TEST(SM50_device_maximum_plus_dsrgemm_nn_t, 8x32x8_8x32x1_2x4_4x8_1x1) { using WarpShape = cutlass::gemm::GemmShape<8, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - 
precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -74,9 +74,9 @@ TEST(SM50_device_maximum_plus_dsrgemm_nn_t, 16x32x8_16x32x1_4x4_4x8_1x1) { using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -110,9 +110,9 @@ TEST(SM50_device_maximum_plus_dsrgemm_nn_t, 16x64x8_16x64x1_4x8_4x8_1x1) { using WarpShape = cutlass::gemm::GemmShape<16, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -146,9 +146,9 @@ TEST(SM50_device_maximum_plus_dsrgemm_nn_t, 32x32x8_32x32x1_8x4_4x8_1x1) { using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; 
+ using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -182,9 +182,9 @@ TEST(SM50_device_maximum_plus_dsrgemm_nn_t, 8x32x8_8x16x1_2x2_4x8_1x2) { using WarpShape = cutlass::gemm::GemmShape<8, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -218,9 +218,9 @@ TEST(SM50_device_maximum_plus_dsrgemm_nn_t, 8x64x8_8x32x1_2x4_4x8_1x2) { using WarpShape = cutlass::gemm::GemmShape<8, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -254,9 +254,9 @@ TEST(SM50_device_maximum_plus_dsrgemm_nn_t, 16x32x8_16x16x1_4x2_4x8_1x2) { using WarpShape = cutlass::gemm::GemmShape<16, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, 
precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -290,9 +290,9 @@ TEST(SM50_device_maximum_plus_dsrgemm_nn_t, 16x64x8_16x32x1_4x4_4x8_1x2) { using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -326,9 +326,9 @@ TEST(SM50_device_maximum_plus_dsrgemm_nn_t, 16x128x8_16x64x1_4x8_4x8_1x2) { using WarpShape = cutlass::gemm::GemmShape<16, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -362,9 +362,9 @@ TEST(SM50_device_maximum_plus_dsrgemm_nn_t, 32x32x8_32x16x1_4x4_8x4_1x2) { using WarpShape = cutlass::gemm::GemmShape<32, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = 
Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -398,9 +398,9 @@ TEST(SM50_device_maximum_plus_dsrgemm_nn_t, 32x64x8_32x32x1_8x4_4x8_1x2) { using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -434,9 +434,9 @@ TEST(SM50_device_maximum_plus_dsrgemm_nn_t, 32x32x8_16x32x1_4x4_4x8_2x1) { using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -470,9 +470,9 @@ TEST(SM50_device_maximum_plus_dsrgemm_nn_t, 64x32x8_32x32x1_8x4_4x8_2x1) { using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -506,9 +506,9 @@ 
TEST(SM50_device_maximum_plus_dsrgemm_nn_t, 16x32x8_8x16x1_2x2_4x8_2x2) { using WarpShape = cutlass::gemm::GemmShape<8, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -542,9 +542,9 @@ TEST(SM50_device_maximum_plus_dsrgemm_nn_t, 16x64x8_8x32x1_2x4_4x8_2x2) { using WarpShape = cutlass::gemm::GemmShape<8, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -578,9 +578,9 @@ TEST(SM50_device_maximum_plus_dsrgemm_nn_t, 32x32x8_16x16x1_4x2_4x8_2x2) { using WarpShape = cutlass::gemm::GemmShape<16, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -614,9 +614,9 @@ TEST(SM50_device_maximum_plus_dsrgemm_nn_t, 32x64x8_16x32x1_4x4_4x8_2x2) { using WarpShape = 
cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -650,9 +650,9 @@ TEST(SM50_device_maximum_plus_dsrgemm_nn_t, 32x128x8_16x64x1_4x8_4x8_2x2) { using WarpShape = cutlass::gemm::GemmShape<16, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -686,9 +686,9 @@ TEST(SM50_device_maximum_plus_dsrgemm_nn_t, 64x32x8_32x16x1_4x4_8x4_2x2) { using WarpShape = cutlass::gemm::GemmShape<32, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -722,9 +722,9 @@ TEST(SM50_device_maximum_plus_dsrgemm_nn_t, 64x64x8_32x32x1_8x4_4x8_2x2) { using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 
1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -758,9 +758,9 @@ TEST(SM50_device_maximum_plus_dsrgemm_nn_t, 128x32x8_64x16x1_8x4_8x4_2x2) { using WarpShape = cutlass::gemm::GemmShape<64, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -794,9 +794,9 @@ TEST(SM50_device_maximum_plus_dsrgemm_nn_t, 16x64x16_8x16x1_2x2_4x8_2x4) { using WarpShape = cutlass::gemm::GemmShape<8, 16, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -830,9 +830,9 @@ TEST(SM50_device_maximum_plus_dsrgemm_nn_t, 16x128x16_8x32x1_2x4_4x8_2x4) { using WarpShape = cutlass::gemm::GemmShape<8, 32, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - 
precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -866,9 +866,9 @@ TEST(SM50_device_maximum_plus_dsrgemm_nn_t, 32x32x8_16x8x1_2x2_8x4_2x4) { using WarpShape = cutlass::gemm::GemmShape<16, 8, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -902,9 +902,9 @@ TEST(SM50_device_maximum_plus_dsrgemm_nn_t, 32x64x8_16x16x1_4x2_4x8_2x4) { using WarpShape = cutlass::gemm::GemmShape<16, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -938,9 +938,9 @@ TEST(SM50_device_maximum_plus_dsrgemm_nn_t, 32x128x8_16x32x1_4x4_4x8_2x4) { using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; 
+ using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -974,9 +974,9 @@ TEST(SM50_device_maximum_plus_dsrgemm_nn_t, 64x64x8_32x16x1_4x4_8x4_2x4) { using WarpShape = cutlass::gemm::GemmShape<32, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1010,9 +1010,9 @@ TEST(SM50_device_maximum_plus_dsrgemm_nn_t, 32x32x8_8x16x1_2x2_4x8_4x2) { using WarpShape = cutlass::gemm::GemmShape<8, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1046,9 +1046,9 @@ TEST(SM50_device_maximum_plus_dsrgemm_nn_t, 64x32x8_16x16x1_4x2_4x8_4x2) { using WarpShape = cutlass::gemm::GemmShape<16, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, 
precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1082,9 +1082,9 @@ TEST(SM50_device_maximum_plus_dsrgemm_nn_t, 64x64x8_16x32x1_4x4_4x8_4x2) { using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1118,9 +1118,9 @@ TEST(SM50_device_maximum_plus_dsrgemm_nn_t, 128x32x8_32x16x1_4x4_8x4_4x2) { using WarpShape = cutlass::gemm::GemmShape<32, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1154,9 +1154,9 @@ TEST(SM50_device_maximum_plus_dsrgemm_nn_t, 32x64x16_8x16x1_2x2_4x8_4x4) { using WarpShape = cutlass::gemm::GemmShape<8, 16, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using 
AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1190,9 +1190,9 @@ TEST(SM50_device_maximum_plus_dsrgemm_nn_t, 32x128x16_8x32x1_2x4_4x8_4x4) { using WarpShape = cutlass::gemm::GemmShape<8, 32, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1226,9 +1226,9 @@ TEST(SM50_device_maximum_plus_dsrgemm_nn_t, 64x32x16_16x8x1_2x2_8x4_4x4) { using WarpShape = cutlass::gemm::GemmShape<16, 8, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1262,9 +1262,9 @@ TEST(SM50_device_maximum_plus_dsrgemm_nn_t, 64x64x8_16x16x1_4x2_4x8_4x4) { using WarpShape = cutlass::gemm::GemmShape<16, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1298,9 +1298,9 
@@ TEST(SM50_device_maximum_plus_dsrgemm_nn_t, 128x32x16_32x8x1_4x2_8x4_4x4) { using WarpShape = cutlass::gemm::GemmShape<32, 8, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; diff --git a/test/device/sm50_simt_maximum_plus_dsrgemm_nt_n.cu b/test/device/sm50_simt_maximum_plus_dsrgemm_nt_n.cu index 367652b..bc09a67 100644 --- a/test/device/sm50_simt_maximum_plus_dsrgemm_nt_n.cu +++ b/test/device/sm50_simt_maximum_plus_dsrgemm_nt_n.cu @@ -38,9 +38,9 @@ TEST(SM50_device_maximum_plus_dsrgemm_nt_n, 8x32x8_8x32x1_2x4_4x8_1x1) { using WarpShape = cutlass::gemm::GemmShape<8, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -74,9 +74,9 @@ TEST(SM50_device_maximum_plus_dsrgemm_nt_n, 16x32x8_16x32x1_4x4_4x8_1x1) { using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, 
precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -110,9 +110,9 @@ TEST(SM50_device_maximum_plus_dsrgemm_nt_n, 16x64x8_16x64x1_4x8_4x8_1x1) { using WarpShape = cutlass::gemm::GemmShape<16, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -146,9 +146,9 @@ TEST(SM50_device_maximum_plus_dsrgemm_nt_n, 32x32x8_32x32x1_8x4_4x8_1x1) { using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -182,9 +182,9 @@ TEST(SM50_device_maximum_plus_dsrgemm_nt_n, 8x32x8_8x16x1_2x2_4x8_1x2) { using WarpShape = cutlass::gemm::GemmShape<8, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = 
Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -218,9 +218,9 @@ TEST(SM50_device_maximum_plus_dsrgemm_nt_n, 8x64x8_8x32x1_2x4_4x8_1x2) { using WarpShape = cutlass::gemm::GemmShape<8, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -254,9 +254,9 @@ TEST(SM50_device_maximum_plus_dsrgemm_nt_n, 16x32x8_16x16x1_4x2_4x8_1x2) { using WarpShape = cutlass::gemm::GemmShape<16, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -290,9 +290,9 @@ TEST(SM50_device_maximum_plus_dsrgemm_nt_n, 16x64x8_16x32x1_4x4_4x8_1x2) { using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -326,9 +326,9 @@ 
TEST(SM50_device_maximum_plus_dsrgemm_nt_n, 16x128x8_16x64x1_4x8_4x8_1x2) { using WarpShape = cutlass::gemm::GemmShape<16, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -362,9 +362,9 @@ TEST(SM50_device_maximum_plus_dsrgemm_nt_n, 32x32x8_32x16x1_4x4_8x4_1x2) { using WarpShape = cutlass::gemm::GemmShape<32, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -398,9 +398,9 @@ TEST(SM50_device_maximum_plus_dsrgemm_nt_n, 32x64x8_32x32x1_8x4_4x8_1x2) { using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -434,9 +434,9 @@ TEST(SM50_device_maximum_plus_dsrgemm_nt_n, 32x32x8_16x32x1_4x4_4x8_2x1) { using WarpShape = 
cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -470,9 +470,9 @@ TEST(SM50_device_maximum_plus_dsrgemm_nt_n, 64x32x8_32x32x1_8x4_4x8_2x1) { using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -506,9 +506,9 @@ TEST(SM50_device_maximum_plus_dsrgemm_nt_n, 16x32x8_8x16x1_2x2_4x8_2x2) { using WarpShape = cutlass::gemm::GemmShape<8, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -542,9 +542,9 @@ TEST(SM50_device_maximum_plus_dsrgemm_nt_n, 16x64x8_8x32x1_2x4_4x8_2x2) { using WarpShape = cutlass::gemm::GemmShape<8, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - 
using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -578,9 +578,9 @@ TEST(SM50_device_maximum_plus_dsrgemm_nt_n, 32x32x8_16x16x1_4x2_4x8_2x2) { using WarpShape = cutlass::gemm::GemmShape<16, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -614,9 +614,9 @@ TEST(SM50_device_maximum_plus_dsrgemm_nt_n, 32x64x8_16x32x1_4x4_4x8_2x2) { using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -650,9 +650,9 @@ TEST(SM50_device_maximum_plus_dsrgemm_nt_n, 32x128x8_16x64x1_4x8_4x8_2x2) { using WarpShape = cutlass::gemm::GemmShape<16, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, 
precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -686,9 +686,9 @@ TEST(SM50_device_maximum_plus_dsrgemm_nt_n, 64x32x8_32x16x1_4x4_8x4_2x2) { using WarpShape = cutlass::gemm::GemmShape<32, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -722,9 +722,9 @@ TEST(SM50_device_maximum_plus_dsrgemm_nt_n, 64x64x8_32x32x1_8x4_4x8_2x2) { using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -758,9 +758,9 @@ TEST(SM50_device_maximum_plus_dsrgemm_nt_n, 128x32x8_64x16x1_8x4_8x4_2x2) { using WarpShape = cutlass::gemm::GemmShape<64, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using 
Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -794,9 +794,9 @@ TEST(SM50_device_maximum_plus_dsrgemm_nt_n, 16x64x16_8x16x1_2x2_4x8_2x4) { using WarpShape = cutlass::gemm::GemmShape<8, 16, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -830,9 +830,9 @@ TEST(SM50_device_maximum_plus_dsrgemm_nt_n, 16x128x16_8x32x1_2x4_4x8_2x4) { using WarpShape = cutlass::gemm::GemmShape<8, 32, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -866,9 +866,9 @@ TEST(SM50_device_maximum_plus_dsrgemm_nt_n, 32x32x8_16x8x1_2x2_8x4_2x4) { using WarpShape = cutlass::gemm::GemmShape<16, 8, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, 
precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -902,9 +902,9 @@ TEST(SM50_device_maximum_plus_dsrgemm_nt_n, 32x64x8_16x16x1_4x2_4x8_2x4) { using WarpShape = cutlass::gemm::GemmShape<16, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -938,9 +938,9 @@ TEST(SM50_device_maximum_plus_dsrgemm_nt_n, 32x128x8_16x32x1_4x4_4x8_2x4) { using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -974,9 +974,9 @@ TEST(SM50_device_maximum_plus_dsrgemm_nt_n, 64x64x8_32x16x1_4x4_8x4_2x4) { using WarpShape = cutlass::gemm::GemmShape<32, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = 
Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1010,9 +1010,9 @@ TEST(SM50_device_maximum_plus_dsrgemm_nt_n, 32x32x8_8x16x1_2x2_4x8_4x2) { using WarpShape = cutlass::gemm::GemmShape<8, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1046,9 +1046,9 @@ TEST(SM50_device_maximum_plus_dsrgemm_nt_n, 64x32x8_16x16x1_4x2_4x8_4x2) { using WarpShape = cutlass::gemm::GemmShape<16, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1082,9 +1082,9 @@ TEST(SM50_device_maximum_plus_dsrgemm_nt_n, 64x64x8_16x32x1_4x4_4x8_4x2) { using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1118,9 +1118,9 @@ 
TEST(SM50_device_maximum_plus_dsrgemm_nt_n, 128x32x8_32x16x1_4x4_8x4_4x2) { using WarpShape = cutlass::gemm::GemmShape<32, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1154,9 +1154,9 @@ TEST(SM50_device_maximum_plus_dsrgemm_nt_n, 32x64x16_8x16x1_2x2_4x8_4x4) { using WarpShape = cutlass::gemm::GemmShape<8, 16, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1190,9 +1190,9 @@ TEST(SM50_device_maximum_plus_dsrgemm_nt_n, 32x128x16_8x32x1_2x4_4x8_4x4) { using WarpShape = cutlass::gemm::GemmShape<8, 32, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1226,9 +1226,9 @@ TEST(SM50_device_maximum_plus_dsrgemm_nt_n, 64x32x16_16x8x1_2x2_8x4_4x4) { using 
WarpShape = cutlass::gemm::GemmShape<16, 8, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1262,9 +1262,9 @@ TEST(SM50_device_maximum_plus_dsrgemm_nt_n, 64x64x8_16x16x1_4x2_4x8_4x4) { using WarpShape = cutlass::gemm::GemmShape<16, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1298,9 +1298,9 @@ TEST(SM50_device_maximum_plus_dsrgemm_nt_n, 128x32x16_32x8x1_4x2_8x4_4x4) { using WarpShape = cutlass::gemm::GemmShape<32, 8, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; diff --git a/test/device/sm50_simt_maximum_plus_dsrgemm_nt_t.cu b/test/device/sm50_simt_maximum_plus_dsrgemm_nt_t.cu index 8b5e817..006f546 100644 --- 
a/test/device/sm50_simt_maximum_plus_dsrgemm_nt_t.cu +++ b/test/device/sm50_simt_maximum_plus_dsrgemm_nt_t.cu @@ -38,9 +38,9 @@ TEST(SM50_device_maximum_plus_dsrgemm_nt_t, 8x32x8_8x32x1_2x4_4x8_1x1) { using WarpShape = cutlass::gemm::GemmShape<8, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -74,9 +74,9 @@ TEST(SM50_device_maximum_plus_dsrgemm_nt_t, 16x32x8_16x32x1_4x4_4x8_1x1) { using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -110,9 +110,9 @@ TEST(SM50_device_maximum_plus_dsrgemm_nt_t, 16x64x8_16x64x1_4x8_4x8_1x1) { using WarpShape = cutlass::gemm::GemmShape<16, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = 
Config::MultiplicationOp; @@ -146,9 +146,9 @@ TEST(SM50_device_maximum_plus_dsrgemm_nt_t, 32x32x8_32x32x1_8x4_4x8_1x1) { using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -182,9 +182,9 @@ TEST(SM50_device_maximum_plus_dsrgemm_nt_t, 8x32x8_8x16x1_2x2_4x8_1x2) { using WarpShape = cutlass::gemm::GemmShape<8, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -218,9 +218,9 @@ TEST(SM50_device_maximum_plus_dsrgemm_nt_t, 8x64x8_8x32x1_2x4_4x8_1x2) { using WarpShape = cutlass::gemm::GemmShape<8, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -254,9 +254,9 @@ TEST(SM50_device_maximum_plus_dsrgemm_nt_t, 
16x32x8_16x16x1_4x2_4x8_1x2) { using WarpShape = cutlass::gemm::GemmShape<16, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -290,9 +290,9 @@ TEST(SM50_device_maximum_plus_dsrgemm_nt_t, 16x64x8_16x32x1_4x4_4x8_1x2) { using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -326,9 +326,9 @@ TEST(SM50_device_maximum_plus_dsrgemm_nt_t, 16x128x8_16x64x1_4x8_4x8_1x2) { using WarpShape = cutlass::gemm::GemmShape<16, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -362,9 +362,9 @@ TEST(SM50_device_maximum_plus_dsrgemm_nt_t, 32x32x8_32x16x1_4x4_8x4_1x2) { using WarpShape = cutlass::gemm::GemmShape<32, 16, 8>; using 
InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -398,9 +398,9 @@ TEST(SM50_device_maximum_plus_dsrgemm_nt_t, 32x64x8_32x32x1_8x4_4x8_1x2) { using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -434,9 +434,9 @@ TEST(SM50_device_maximum_plus_dsrgemm_nt_t, 32x32x8_16x32x1_4x4_4x8_2x1) { using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -470,9 +470,9 @@ TEST(SM50_device_maximum_plus_dsrgemm_nt_t, 64x32x8_32x32x1_8x4_4x8_2x1) { using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename 
cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -506,9 +506,9 @@ TEST(SM50_device_maximum_plus_dsrgemm_nt_t, 16x32x8_8x16x1_2x2_4x8_2x2) { using WarpShape = cutlass::gemm::GemmShape<8, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -542,9 +542,9 @@ TEST(SM50_device_maximum_plus_dsrgemm_nt_t, 16x64x8_8x32x1_2x4_4x8_2x2) { using WarpShape = cutlass::gemm::GemmShape<8, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -578,9 +578,9 @@ TEST(SM50_device_maximum_plus_dsrgemm_nt_t, 32x32x8_16x16x1_4x2_4x8_2x2) { using WarpShape = cutlass::gemm::GemmShape<16, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, 
precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -614,9 +614,9 @@ TEST(SM50_device_maximum_plus_dsrgemm_nt_t, 32x64x8_16x32x1_4x4_4x8_2x2) { using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -650,9 +650,9 @@ TEST(SM50_device_maximum_plus_dsrgemm_nt_t, 32x128x8_16x64x1_4x8_4x8_2x2) { using WarpShape = cutlass::gemm::GemmShape<16, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -686,9 +686,9 @@ TEST(SM50_device_maximum_plus_dsrgemm_nt_t, 64x32x8_32x16x1_4x4_8x4_2x2) { using WarpShape = cutlass::gemm::GemmShape<32, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename 
cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -722,9 +722,9 @@ TEST(SM50_device_maximum_plus_dsrgemm_nt_t, 64x64x8_32x32x1_8x4_4x8_2x2) { using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -758,9 +758,9 @@ TEST(SM50_device_maximum_plus_dsrgemm_nt_t, 128x32x8_64x16x1_8x4_8x4_2x2) { using WarpShape = cutlass::gemm::GemmShape<64, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -794,9 +794,9 @@ TEST(SM50_device_maximum_plus_dsrgemm_nt_t, 16x64x16_8x16x1_2x2_4x8_2x4) { using WarpShape = cutlass::gemm::GemmShape<8, 16, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, 
precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -830,9 +830,9 @@ TEST(SM50_device_maximum_plus_dsrgemm_nt_t, 16x128x16_8x32x1_2x4_4x8_2x4) { using WarpShape = cutlass::gemm::GemmShape<8, 32, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -866,9 +866,9 @@ TEST(SM50_device_maximum_plus_dsrgemm_nt_t, 32x32x8_16x8x1_2x2_8x4_2x4) { using WarpShape = cutlass::gemm::GemmShape<16, 8, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -902,9 +902,9 @@ TEST(SM50_device_maximum_plus_dsrgemm_nt_t, 32x64x8_16x16x1_4x2_4x8_2x4) { using WarpShape = cutlass::gemm::GemmShape<16, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; 
using MultOp = Config::MultiplicationOp; @@ -938,9 +938,9 @@ TEST(SM50_device_maximum_plus_dsrgemm_nt_t, 32x128x8_16x32x1_4x4_4x8_2x4) { using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -974,9 +974,9 @@ TEST(SM50_device_maximum_plus_dsrgemm_nt_t, 64x64x8_32x16x1_4x4_8x4_2x4) { using WarpShape = cutlass::gemm::GemmShape<32, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1010,9 +1010,9 @@ TEST(SM50_device_maximum_plus_dsrgemm_nt_t, 32x32x8_8x16x1_2x2_4x8_4x2) { using WarpShape = cutlass::gemm::GemmShape<8, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1046,9 +1046,9 @@ 
TEST(SM50_device_maximum_plus_dsrgemm_nt_t, 64x32x8_16x16x1_4x2_4x8_4x2) { using WarpShape = cutlass::gemm::GemmShape<16, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1082,9 +1082,9 @@ TEST(SM50_device_maximum_plus_dsrgemm_nt_t, 64x64x8_16x32x1_4x4_4x8_4x2) { using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1118,9 +1118,9 @@ TEST(SM50_device_maximum_plus_dsrgemm_nt_t, 128x32x8_32x16x1_4x4_8x4_4x2) { using WarpShape = cutlass::gemm::GemmShape<32, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1154,9 +1154,9 @@ TEST(SM50_device_maximum_plus_dsrgemm_nt_t, 32x64x16_8x16x1_2x2_4x8_4x4) { using 
WarpShape = cutlass::gemm::GemmShape<8, 16, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1190,9 +1190,9 @@ TEST(SM50_device_maximum_plus_dsrgemm_nt_t, 32x128x16_8x32x1_2x4_4x8_4x4) { using WarpShape = cutlass::gemm::GemmShape<8, 32, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1226,9 +1226,9 @@ TEST(SM50_device_maximum_plus_dsrgemm_nt_t, 64x32x16_16x8x1_2x2_8x4_4x4) { using WarpShape = cutlass::gemm::GemmShape<16, 8, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1262,9 +1262,9 @@ TEST(SM50_device_maximum_plus_dsrgemm_nt_t, 64x64x8_16x16x1_4x2_4x8_4x4) { using WarpShape = cutlass::gemm::GemmShape<16, 16, 8>; using InstructionShape = 
cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1298,9 +1298,9 @@ TEST(SM50_device_maximum_plus_dsrgemm_nt_t, 128x32x16_32x8x1_4x2_8x4_4x4) { using WarpShape = cutlass::gemm::GemmShape<32, 8, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; diff --git a/test/device/sm50_simt_maximum_plus_dsrgemm_tn_n.cu b/test/device/sm50_simt_maximum_plus_dsrgemm_tn_n.cu index 078312e..5675bab 100644 --- a/test/device/sm50_simt_maximum_plus_dsrgemm_tn_n.cu +++ b/test/device/sm50_simt_maximum_plus_dsrgemm_tn_n.cu @@ -38,9 +38,9 @@ TEST(SM50_device_maximum_plus_dsrgemm_tn_n, 8x32x8_8x32x1_2x4_4x8_1x1) { using WarpShape = cutlass::gemm::GemmShape<8, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -74,9 
+74,9 @@ TEST(SM50_device_maximum_plus_dsrgemm_tn_n, 16x32x8_16x32x1_4x4_4x8_1x1) { using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -110,9 +110,9 @@ TEST(SM50_device_maximum_plus_dsrgemm_tn_n, 16x64x8_16x64x1_4x8_4x8_1x1) { using WarpShape = cutlass::gemm::GemmShape<16, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -146,9 +146,9 @@ TEST(SM50_device_maximum_plus_dsrgemm_tn_n, 32x32x8_32x32x1_8x4_4x8_1x1) { using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -182,9 +182,9 @@ TEST(SM50_device_maximum_plus_dsrgemm_tn_n, 8x32x8_8x16x1_2x2_4x8_1x2) { using 
WarpShape = cutlass::gemm::GemmShape<8, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -218,9 +218,9 @@ TEST(SM50_device_maximum_plus_dsrgemm_tn_n, 8x64x8_8x32x1_2x4_4x8_1x2) { using WarpShape = cutlass::gemm::GemmShape<8, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -254,9 +254,9 @@ TEST(SM50_device_maximum_plus_dsrgemm_tn_n, 16x32x8_16x16x1_4x2_4x8_1x2) { using WarpShape = cutlass::gemm::GemmShape<16, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -290,9 +290,9 @@ TEST(SM50_device_maximum_plus_dsrgemm_tn_n, 16x64x8_16x32x1_4x4_4x8_1x2) { using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = 
cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -326,9 +326,9 @@ TEST(SM50_device_maximum_plus_dsrgemm_tn_n, 16x128x8_16x64x1_4x8_4x8_1x2) { using WarpShape = cutlass::gemm::GemmShape<16, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -362,9 +362,9 @@ TEST(SM50_device_maximum_plus_dsrgemm_tn_n, 32x32x8_32x16x1_4x4_8x4_1x2) { using WarpShape = cutlass::gemm::GemmShape<32, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -398,9 +398,9 @@ TEST(SM50_device_maximum_plus_dsrgemm_tn_n, 32x64x8_32x32x1_8x4_4x8_1x2) { using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename 
cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -434,9 +434,9 @@ TEST(SM50_device_maximum_plus_dsrgemm_tn_n, 32x32x8_16x32x1_4x4_4x8_2x1) { using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -470,9 +470,9 @@ TEST(SM50_device_maximum_plus_dsrgemm_tn_n, 64x32x8_32x32x1_8x4_4x8_2x1) { using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -506,9 +506,9 @@ TEST(SM50_device_maximum_plus_dsrgemm_tn_n, 16x32x8_8x16x1_2x2_4x8_2x2) { using WarpShape = cutlass::gemm::GemmShape<8, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, 
precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -542,9 +542,9 @@ TEST(SM50_device_maximum_plus_dsrgemm_tn_n, 16x64x8_8x32x1_2x4_4x8_2x2) { using WarpShape = cutlass::gemm::GemmShape<8, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -578,9 +578,9 @@ TEST(SM50_device_maximum_plus_dsrgemm_tn_n, 32x32x8_16x16x1_4x2_4x8_2x2) { using WarpShape = cutlass::gemm::GemmShape<16, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -614,9 +614,9 @@ TEST(SM50_device_maximum_plus_dsrgemm_tn_n, 32x64x8_16x32x1_4x4_4x8_2x2) { using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename 
cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -650,9 +650,9 @@ TEST(SM50_device_maximum_plus_dsrgemm_tn_n, 32x128x8_16x64x1_4x8_4x8_2x2) { using WarpShape = cutlass::gemm::GemmShape<16, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -686,9 +686,9 @@ TEST(SM50_device_maximum_plus_dsrgemm_tn_n, 64x32x8_32x16x1_4x4_8x4_2x2) { using WarpShape = cutlass::gemm::GemmShape<32, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -722,9 +722,9 @@ TEST(SM50_device_maximum_plus_dsrgemm_tn_n, 64x64x8_32x32x1_8x4_4x8_2x2) { using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, 
precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -758,9 +758,9 @@ TEST(SM50_device_maximum_plus_dsrgemm_tn_n, 128x32x8_64x16x1_8x4_8x4_2x2) { using WarpShape = cutlass::gemm::GemmShape<64, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -794,9 +794,9 @@ TEST(SM50_device_maximum_plus_dsrgemm_tn_n, 16x64x16_8x16x1_2x2_4x8_2x4) { using WarpShape = cutlass::gemm::GemmShape<8, 16, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -830,9 +830,9 @@ TEST(SM50_device_maximum_plus_dsrgemm_tn_n, 16x128x16_8x32x1_2x4_4x8_2x4) { using WarpShape = cutlass::gemm::GemmShape<8, 32, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = 
Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -866,9 +866,9 @@ TEST(SM50_device_maximum_plus_dsrgemm_tn_n, 32x32x8_16x8x1_2x2_8x4_2x4) { using WarpShape = cutlass::gemm::GemmShape<16, 8, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -902,9 +902,9 @@ TEST(SM50_device_maximum_plus_dsrgemm_tn_n, 32x64x8_16x16x1_4x2_4x8_2x4) { using WarpShape = cutlass::gemm::GemmShape<16, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -938,9 +938,9 @@ TEST(SM50_device_maximum_plus_dsrgemm_tn_n, 32x128x8_16x32x1_4x4_4x8_2x4) { using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -974,9 +974,9 @@ 
TEST(SM50_device_maximum_plus_dsrgemm_tn_n, 64x64x8_32x16x1_4x4_8x4_2x4) { using WarpShape = cutlass::gemm::GemmShape<32, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1010,9 +1010,9 @@ TEST(SM50_device_maximum_plus_dsrgemm_tn_n, 32x32x8_8x16x1_2x2_4x8_4x2) { using WarpShape = cutlass::gemm::GemmShape<8, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1046,9 +1046,9 @@ TEST(SM50_device_maximum_plus_dsrgemm_tn_n, 64x32x8_16x16x1_4x2_4x8_4x2) { using WarpShape = cutlass::gemm::GemmShape<16, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1082,9 +1082,9 @@ TEST(SM50_device_maximum_plus_dsrgemm_tn_n, 64x64x8_16x32x1_4x4_4x8_4x2) { using WarpShape 
= cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1118,9 +1118,9 @@ TEST(SM50_device_maximum_plus_dsrgemm_tn_n, 128x32x8_32x16x1_4x4_8x4_4x2) { using WarpShape = cutlass::gemm::GemmShape<32, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1154,9 +1154,9 @@ TEST(SM50_device_maximum_plus_dsrgemm_tn_n, 32x64x16_8x16x1_2x2_4x8_4x4) { using WarpShape = cutlass::gemm::GemmShape<8, 16, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1190,9 +1190,9 @@ TEST(SM50_device_maximum_plus_dsrgemm_tn_n, 32x128x16_8x32x1_2x4_4x8_4x4) { using WarpShape = cutlass::gemm::GemmShape<8, 32, 16>; using InstructionShape = 
cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1226,9 +1226,9 @@ TEST(SM50_device_maximum_plus_dsrgemm_tn_n, 64x32x16_16x8x1_2x2_8x4_4x4) { using WarpShape = cutlass::gemm::GemmShape<16, 8, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1262,9 +1262,9 @@ TEST(SM50_device_maximum_plus_dsrgemm_tn_n, 64x64x8_16x16x1_4x2_4x8_4x4) { using WarpShape = cutlass::gemm::GemmShape<16, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1298,9 +1298,9 @@ TEST(SM50_device_maximum_plus_dsrgemm_tn_n, 128x32x16_32x8x1_4x2_8x4_4x4) { using WarpShape = cutlass::gemm::GemmShape<32, 8, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename 
cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; diff --git a/test/device/sm50_simt_maximum_plus_dsrgemm_tn_t.cu b/test/device/sm50_simt_maximum_plus_dsrgemm_tn_t.cu index fb2156a..7b29ce5 100644 --- a/test/device/sm50_simt_maximum_plus_dsrgemm_tn_t.cu +++ b/test/device/sm50_simt_maximum_plus_dsrgemm_tn_t.cu @@ -38,9 +38,9 @@ TEST(SM50_device_maximum_plus_dsrgemm_tn_t, 8x32x8_8x32x1_2x4_4x8_1x1) { using WarpShape = cutlass::gemm::GemmShape<8, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -74,9 +74,9 @@ TEST(SM50_device_maximum_plus_dsrgemm_tn_t, 16x32x8_16x32x1_4x4_4x8_1x1) { using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -110,9 +110,9 @@ TEST(SM50_device_maximum_plus_dsrgemm_tn_t, 
16x64x8_16x64x1_4x8_4x8_1x1) { using WarpShape = cutlass::gemm::GemmShape<16, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -146,9 +146,9 @@ TEST(SM50_device_maximum_plus_dsrgemm_tn_t, 32x32x8_32x32x1_8x4_4x8_1x1) { using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -182,9 +182,9 @@ TEST(SM50_device_maximum_plus_dsrgemm_tn_t, 8x32x8_8x16x1_2x2_4x8_1x2) { using WarpShape = cutlass::gemm::GemmShape<8, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -218,9 +218,9 @@ TEST(SM50_device_maximum_plus_dsrgemm_tn_t, 8x64x8_8x32x1_2x4_4x8_1x2) { using WarpShape = cutlass::gemm::GemmShape<8, 32, 8>; using 
InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -254,9 +254,9 @@ TEST(SM50_device_maximum_plus_dsrgemm_tn_t, 16x32x8_16x16x1_4x2_4x8_1x2) { using WarpShape = cutlass::gemm::GemmShape<16, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -290,9 +290,9 @@ TEST(SM50_device_maximum_plus_dsrgemm_tn_t, 16x64x8_16x32x1_4x4_4x8_1x2) { using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -326,9 +326,9 @@ TEST(SM50_device_maximum_plus_dsrgemm_tn_t, 16x128x8_16x64x1_4x8_4x8_1x2) { using WarpShape = cutlass::gemm::GemmShape<16, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename 
cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -362,9 +362,9 @@ TEST(SM50_device_maximum_plus_dsrgemm_tn_t, 32x32x8_32x16x1_4x4_8x4_1x2) { using WarpShape = cutlass::gemm::GemmShape<32, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -398,9 +398,9 @@ TEST(SM50_device_maximum_plus_dsrgemm_tn_t, 32x64x8_32x32x1_8x4_4x8_1x2) { using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -434,9 +434,9 @@ TEST(SM50_device_maximum_plus_dsrgemm_tn_t, 32x32x8_16x32x1_4x4_4x8_2x1) { using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, 
precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -470,9 +470,9 @@ TEST(SM50_device_maximum_plus_dsrgemm_tn_t, 64x32x8_32x32x1_8x4_4x8_2x1) { using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -506,9 +506,9 @@ TEST(SM50_device_maximum_plus_dsrgemm_tn_t, 16x32x8_8x16x1_2x2_4x8_2x2) { using WarpShape = cutlass::gemm::GemmShape<8, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -542,9 +542,9 @@ TEST(SM50_device_maximum_plus_dsrgemm_tn_t, 16x64x8_8x32x1_2x4_4x8_2x2) { using WarpShape = cutlass::gemm::GemmShape<8, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename 
cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -578,9 +578,9 @@ TEST(SM50_device_maximum_plus_dsrgemm_tn_t, 32x32x8_16x16x1_4x2_4x8_2x2) { using WarpShape = cutlass::gemm::GemmShape<16, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -614,9 +614,9 @@ TEST(SM50_device_maximum_plus_dsrgemm_tn_t, 32x64x8_16x32x1_4x4_4x8_2x2) { using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -650,9 +650,9 @@ TEST(SM50_device_maximum_plus_dsrgemm_tn_t, 32x128x8_16x64x1_4x8_4x8_2x2) { using WarpShape = cutlass::gemm::GemmShape<16, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, 
precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -686,9 +686,9 @@ TEST(SM50_device_maximum_plus_dsrgemm_tn_t, 64x32x8_32x16x1_4x4_8x4_2x2) { using WarpShape = cutlass::gemm::GemmShape<32, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -722,9 +722,9 @@ TEST(SM50_device_maximum_plus_dsrgemm_tn_t, 64x64x8_32x32x1_8x4_4x8_2x2) { using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -758,9 +758,9 @@ TEST(SM50_device_maximum_plus_dsrgemm_tn_t, 128x32x8_64x16x1_8x4_8x4_2x2) { using WarpShape = cutlass::gemm::GemmShape<64, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; 
using MultOp = Config::MultiplicationOp; @@ -794,9 +794,9 @@ TEST(SM50_device_maximum_plus_dsrgemm_tn_t, 16x64x16_8x16x1_2x2_4x8_2x4) { using WarpShape = cutlass::gemm::GemmShape<8, 16, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -830,9 +830,9 @@ TEST(SM50_device_maximum_plus_dsrgemm_tn_t, 16x128x16_8x32x1_2x4_4x8_2x4) { using WarpShape = cutlass::gemm::GemmShape<8, 32, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -866,9 +866,9 @@ TEST(SM50_device_maximum_plus_dsrgemm_tn_t, 32x32x8_16x8x1_2x2_8x4_2x4) { using WarpShape = cutlass::gemm::GemmShape<16, 8, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -902,9 +902,9 @@ 
TEST(SM50_device_maximum_plus_dsrgemm_tn_t, 32x64x8_16x16x1_4x2_4x8_2x4) { using WarpShape = cutlass::gemm::GemmShape<16, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -938,9 +938,9 @@ TEST(SM50_device_maximum_plus_dsrgemm_tn_t, 32x128x8_16x32x1_4x4_4x8_2x4) { using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -974,9 +974,9 @@ TEST(SM50_device_maximum_plus_dsrgemm_tn_t, 64x64x8_32x16x1_4x4_8x4_2x4) { using WarpShape = cutlass::gemm::GemmShape<32, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1010,9 +1010,9 @@ TEST(SM50_device_maximum_plus_dsrgemm_tn_t, 32x32x8_8x16x1_2x2_4x8_4x2) { using WarpShape = 
cutlass::gemm::GemmShape<8, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1046,9 +1046,9 @@ TEST(SM50_device_maximum_plus_dsrgemm_tn_t, 64x32x8_16x16x1_4x2_4x8_4x2) { using WarpShape = cutlass::gemm::GemmShape<16, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1082,9 +1082,9 @@ TEST(SM50_device_maximum_plus_dsrgemm_tn_t, 64x64x8_16x32x1_4x4_4x8_4x2) { using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1118,9 +1118,9 @@ TEST(SM50_device_maximum_plus_dsrgemm_tn_t, 128x32x8_32x16x1_4x4_8x4_4x2) { using WarpShape = cutlass::gemm::GemmShape<32, 16, 8>; using InstructionShape = 
cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1154,9 +1154,9 @@ TEST(SM50_device_maximum_plus_dsrgemm_tn_t, 32x64x16_8x16x1_2x2_4x8_4x4) { using WarpShape = cutlass::gemm::GemmShape<8, 16, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1190,9 +1190,9 @@ TEST(SM50_device_maximum_plus_dsrgemm_tn_t, 32x128x16_8x32x1_2x4_4x8_4x4) { using WarpShape = cutlass::gemm::GemmShape<8, 32, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1226,9 +1226,9 @@ TEST(SM50_device_maximum_plus_dsrgemm_tn_t, 64x32x16_16x8x1_2x2_8x4_4x4) { using WarpShape = cutlass::gemm::GemmShape<16, 8, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename 
cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1262,9 +1262,9 @@ TEST(SM50_device_maximum_plus_dsrgemm_tn_t, 64x64x8_16x16x1_4x2_4x8_4x4) { using WarpShape = cutlass::gemm::GemmShape<16, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1298,9 +1298,9 @@ TEST(SM50_device_maximum_plus_dsrgemm_tn_t, 128x32x16_32x8x1_4x2_8x4_4x4) { using WarpShape = cutlass::gemm::GemmShape<32, 8, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; diff --git a/test/device/sm50_simt_maximum_plus_dsrgemm_tt_n.cu b/test/device/sm50_simt_maximum_plus_dsrgemm_tt_n.cu index 92d7597..992103e 100644 --- a/test/device/sm50_simt_maximum_plus_dsrgemm_tt_n.cu +++ b/test/device/sm50_simt_maximum_plus_dsrgemm_tt_n.cu @@ -38,9 +38,9 @@ TEST(SM50_device_maximum_plus_dsrgemm_tt_n, 
8x32x8_8x32x1_2x4_4x8_1x1) { using WarpShape = cutlass::gemm::GemmShape<8, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -74,9 +74,9 @@ TEST(SM50_device_maximum_plus_dsrgemm_tt_n, 16x32x8_16x32x1_4x4_4x8_1x1) { using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -110,9 +110,9 @@ TEST(SM50_device_maximum_plus_dsrgemm_tt_n, 16x64x8_16x64x1_4x8_4x8_1x1) { using WarpShape = cutlass::gemm::GemmShape<16, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -146,9 +146,9 @@ TEST(SM50_device_maximum_plus_dsrgemm_tt_n, 32x32x8_32x32x1_8x4_4x8_1x1) { using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using 
InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -182,9 +182,9 @@ TEST(SM50_device_maximum_plus_dsrgemm_tt_n, 8x32x8_8x16x1_2x2_4x8_1x2) { using WarpShape = cutlass::gemm::GemmShape<8, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -218,9 +218,9 @@ TEST(SM50_device_maximum_plus_dsrgemm_tt_n, 8x64x8_8x32x1_2x4_4x8_1x2) { using WarpShape = cutlass::gemm::GemmShape<8, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -254,9 +254,9 @@ TEST(SM50_device_maximum_plus_dsrgemm_tt_n, 16x32x8_16x16x1_4x2_4x8_1x2) { using WarpShape = cutlass::gemm::GemmShape<16, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename 
cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -290,9 +290,9 @@ TEST(SM50_device_maximum_plus_dsrgemm_tt_n, 16x64x8_16x32x1_4x4_4x8_1x2) { using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -326,9 +326,9 @@ TEST(SM50_device_maximum_plus_dsrgemm_tt_n, 16x128x8_16x64x1_4x8_4x8_1x2) { using WarpShape = cutlass::gemm::GemmShape<16, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -362,9 +362,9 @@ TEST(SM50_device_maximum_plus_dsrgemm_tt_n, 32x32x8_32x16x1_4x4_8x4_1x2) { using WarpShape = cutlass::gemm::GemmShape<32, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, 
precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -398,9 +398,9 @@ TEST(SM50_device_maximum_plus_dsrgemm_tt_n, 32x64x8_32x32x1_8x4_4x8_1x2) { using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -434,9 +434,9 @@ TEST(SM50_device_maximum_plus_dsrgemm_tt_n, 32x32x8_16x32x1_4x4_4x8_2x1) { using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -470,9 +470,9 @@ TEST(SM50_device_maximum_plus_dsrgemm_tt_n, 64x32x8_32x32x1_8x4_4x8_2x1) { using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename 
cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -506,9 +506,9 @@ TEST(SM50_device_maximum_plus_dsrgemm_tt_n, 16x32x8_8x16x1_2x2_4x8_2x2) { using WarpShape = cutlass::gemm::GemmShape<8, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -542,9 +542,9 @@ TEST(SM50_device_maximum_plus_dsrgemm_tt_n, 16x64x8_8x32x1_2x4_4x8_2x2) { using WarpShape = cutlass::gemm::GemmShape<8, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -578,9 +578,9 @@ TEST(SM50_device_maximum_plus_dsrgemm_tt_n, 32x32x8_16x16x1_4x2_4x8_2x2) { using WarpShape = cutlass::gemm::GemmShape<16, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + 
cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -614,9 +614,9 @@ TEST(SM50_device_maximum_plus_dsrgemm_tt_n, 32x64x8_16x32x1_4x4_4x8_2x2) { using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -650,9 +650,9 @@ TEST(SM50_device_maximum_plus_dsrgemm_tt_n, 32x128x8_16x64x1_4x8_4x8_2x2) { using WarpShape = cutlass::gemm::GemmShape<16, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -686,9 +686,9 @@ TEST(SM50_device_maximum_plus_dsrgemm_tt_n, 64x32x8_32x16x1_4x4_8x4_2x2) { using WarpShape = cutlass::gemm::GemmShape<32, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp 
= Config::MultiplicationOp; @@ -722,9 +722,9 @@ TEST(SM50_device_maximum_plus_dsrgemm_tt_n, 64x64x8_32x32x1_8x4_4x8_2x2) { using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -758,9 +758,9 @@ TEST(SM50_device_maximum_plus_dsrgemm_tt_n, 128x32x8_64x16x1_8x4_8x4_2x2) { using WarpShape = cutlass::gemm::GemmShape<64, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -794,9 +794,9 @@ TEST(SM50_device_maximum_plus_dsrgemm_tt_n, 16x64x16_8x16x1_2x2_4x8_2x4) { using WarpShape = cutlass::gemm::GemmShape<8, 16, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -830,9 +830,9 @@ TEST(SM50_device_maximum_plus_dsrgemm_tt_n, 
16x128x16_8x32x1_2x4_4x8_2x4) { using WarpShape = cutlass::gemm::GemmShape<8, 32, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -866,9 +866,9 @@ TEST(SM50_device_maximum_plus_dsrgemm_tt_n, 32x32x8_16x8x1_2x2_8x4_2x4) { using WarpShape = cutlass::gemm::GemmShape<16, 8, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -902,9 +902,9 @@ TEST(SM50_device_maximum_plus_dsrgemm_tt_n, 32x64x8_16x16x1_4x2_4x8_2x4) { using WarpShape = cutlass::gemm::GemmShape<16, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -938,9 +938,9 @@ TEST(SM50_device_maximum_plus_dsrgemm_tt_n, 32x128x8_16x32x1_4x4_4x8_2x4) { using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using 
InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -974,9 +974,9 @@ TEST(SM50_device_maximum_plus_dsrgemm_tt_n, 64x64x8_32x16x1_4x4_8x4_2x4) { using WarpShape = cutlass::gemm::GemmShape<32, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1010,9 +1010,9 @@ TEST(SM50_device_maximum_plus_dsrgemm_tt_n, 32x32x8_8x16x1_2x2_4x8_4x2) { using WarpShape = cutlass::gemm::GemmShape<8, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1046,9 +1046,9 @@ TEST(SM50_device_maximum_plus_dsrgemm_tt_n, 64x32x8_16x16x1_4x2_4x8_4x2) { using WarpShape = cutlass::gemm::GemmShape<16, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename 
cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1082,9 +1082,9 @@ TEST(SM50_device_maximum_plus_dsrgemm_tt_n, 64x64x8_16x32x1_4x4_4x8_4x2) { using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1118,9 +1118,9 @@ TEST(SM50_device_maximum_plus_dsrgemm_tt_n, 128x32x8_32x16x1_4x4_8x4_4x2) { using WarpShape = cutlass::gemm::GemmShape<32, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1154,9 +1154,9 @@ TEST(SM50_device_maximum_plus_dsrgemm_tt_n, 32x64x16_8x16x1_2x2_4x8_4x4) { using WarpShape = cutlass::gemm::GemmShape<8, 16, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, 
precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1190,9 +1190,9 @@ TEST(SM50_device_maximum_plus_dsrgemm_tt_n, 32x128x16_8x32x1_2x4_4x8_4x4) { using WarpShape = cutlass::gemm::GemmShape<8, 32, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1226,9 +1226,9 @@ TEST(SM50_device_maximum_plus_dsrgemm_tt_n, 64x32x16_16x8x1_2x2_8x4_4x4) { using WarpShape = cutlass::gemm::GemmShape<16, 8, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1262,9 +1262,9 @@ TEST(SM50_device_maximum_plus_dsrgemm_tt_n, 64x64x8_16x16x1_4x2_4x8_4x4) { using WarpShape = cutlass::gemm::GemmShape<16, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using 
Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1298,9 +1298,9 @@ TEST(SM50_device_maximum_plus_dsrgemm_tt_n, 128x32x16_32x8x1_4x2_8x4_4x4) { using WarpShape = cutlass::gemm::GemmShape<32, 8, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; diff --git a/test/device/sm50_simt_maximum_plus_dsrgemm_tt_t.cu b/test/device/sm50_simt_maximum_plus_dsrgemm_tt_t.cu index 8600765..a3be64e 100644 --- a/test/device/sm50_simt_maximum_plus_dsrgemm_tt_t.cu +++ b/test/device/sm50_simt_maximum_plus_dsrgemm_tt_t.cu @@ -38,9 +38,9 @@ TEST(SM50_device_maximum_plus_dsrgemm_tt_t, 8x32x8_8x32x1_2x4_4x8_1x1) { using WarpShape = cutlass::gemm::GemmShape<8, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -74,9 +74,9 @@ TEST(SM50_device_maximum_plus_dsrgemm_tt_t, 16x32x8_16x32x1_4x4_4x8_1x1) { using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = 
typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -110,9 +110,9 @@ TEST(SM50_device_maximum_plus_dsrgemm_tt_t, 16x64x8_16x64x1_4x8_4x8_1x1) { using WarpShape = cutlass::gemm::GemmShape<16, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -146,9 +146,9 @@ TEST(SM50_device_maximum_plus_dsrgemm_tt_t, 32x32x8_32x32x1_8x4_4x8_1x1) { using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -182,9 +182,9 @@ TEST(SM50_device_maximum_plus_dsrgemm_tt_t, 8x32x8_8x16x1_2x2_4x8_1x2) { using WarpShape = cutlass::gemm::GemmShape<8, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, 
precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -218,9 +218,9 @@ TEST(SM50_device_maximum_plus_dsrgemm_tt_t, 8x64x8_8x32x1_2x4_4x8_1x2) { using WarpShape = cutlass::gemm::GemmShape<8, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -254,9 +254,9 @@ TEST(SM50_device_maximum_plus_dsrgemm_tt_t, 16x32x8_16x16x1_4x2_4x8_1x2) { using WarpShape = cutlass::gemm::GemmShape<16, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -290,9 +290,9 @@ TEST(SM50_device_maximum_plus_dsrgemm_tt_t, 16x64x8_16x32x1_4x4_4x8_1x2) { using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename 
cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -326,9 +326,9 @@ TEST(SM50_device_maximum_plus_dsrgemm_tt_t, 16x128x8_16x64x1_4x8_4x8_1x2) { using WarpShape = cutlass::gemm::GemmShape<16, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -362,9 +362,9 @@ TEST(SM50_device_maximum_plus_dsrgemm_tt_t, 32x32x8_32x16x1_4x4_8x4_1x2) { using WarpShape = cutlass::gemm::GemmShape<32, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -398,9 +398,9 @@ TEST(SM50_device_maximum_plus_dsrgemm_tt_t, 32x64x8_32x32x1_8x4_4x8_1x2) { using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, 
precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -434,9 +434,9 @@ TEST(SM50_device_maximum_plus_dsrgemm_tt_t, 32x32x8_16x32x1_4x4_4x8_2x1) { using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -470,9 +470,9 @@ TEST(SM50_device_maximum_plus_dsrgemm_tt_t, 64x32x8_32x32x1_8x4_4x8_2x1) { using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -506,9 +506,9 @@ TEST(SM50_device_maximum_plus_dsrgemm_tt_t, 16x32x8_8x16x1_2x2_4x8_2x2) { using WarpShape = cutlass::gemm::GemmShape<8, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; 
using MultOp = Config::MultiplicationOp; @@ -542,9 +542,9 @@ TEST(SM50_device_maximum_plus_dsrgemm_tt_t, 16x64x8_8x32x1_2x4_4x8_2x2) { using WarpShape = cutlass::gemm::GemmShape<8, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -578,9 +578,9 @@ TEST(SM50_device_maximum_plus_dsrgemm_tt_t, 32x32x8_16x16x1_4x2_4x8_2x2) { using WarpShape = cutlass::gemm::GemmShape<16, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -614,9 +614,9 @@ TEST(SM50_device_maximum_plus_dsrgemm_tt_t, 32x64x8_16x32x1_4x4_4x8_2x2) { using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -650,9 +650,9 @@ 
TEST(SM50_device_maximum_plus_dsrgemm_tt_t, 32x128x8_16x64x1_4x8_4x8_2x2) { using WarpShape = cutlass::gemm::GemmShape<16, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -686,9 +686,9 @@ TEST(SM50_device_maximum_plus_dsrgemm_tt_t, 64x32x8_32x16x1_4x4_8x4_2x2) { using WarpShape = cutlass::gemm::GemmShape<32, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -722,9 +722,9 @@ TEST(SM50_device_maximum_plus_dsrgemm_tt_t, 64x64x8_32x32x1_8x4_4x8_2x2) { using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -758,9 +758,9 @@ TEST(SM50_device_maximum_plus_dsrgemm_tt_t, 128x32x8_64x16x1_8x4_8x4_2x2) { using WarpShape = 
cutlass::gemm::GemmShape<64, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -794,9 +794,9 @@ TEST(SM50_device_maximum_plus_dsrgemm_tt_t, 16x64x16_8x16x1_2x2_4x8_2x4) { using WarpShape = cutlass::gemm::GemmShape<8, 16, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -830,9 +830,9 @@ TEST(SM50_device_maximum_plus_dsrgemm_tt_t, 16x128x16_8x32x1_2x4_4x8_2x4) { using WarpShape = cutlass::gemm::GemmShape<8, 32, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -866,9 +866,9 @@ TEST(SM50_device_maximum_plus_dsrgemm_tt_t, 32x32x8_16x8x1_2x2_8x4_2x4) { using WarpShape = cutlass::gemm::GemmShape<16, 8, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 
1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -902,9 +902,9 @@ TEST(SM50_device_maximum_plus_dsrgemm_tt_t, 32x64x8_16x16x1_4x2_4x8_2x4) { using WarpShape = cutlass::gemm::GemmShape<16, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -938,9 +938,9 @@ TEST(SM50_device_maximum_plus_dsrgemm_tt_t, 32x128x8_16x32x1_4x4_4x8_2x4) { using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -974,9 +974,9 @@ TEST(SM50_device_maximum_plus_dsrgemm_tt_t, 64x64x8_32x16x1_4x4_8x4_2x4) { using WarpShape = cutlass::gemm::GemmShape<32, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - 
precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1010,9 +1010,9 @@ TEST(SM50_device_maximum_plus_dsrgemm_tt_t, 32x32x8_8x16x1_2x2_4x8_4x2) { using WarpShape = cutlass::gemm::GemmShape<8, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1046,9 +1046,9 @@ TEST(SM50_device_maximum_plus_dsrgemm_tt_t, 64x32x8_16x16x1_4x2_4x8_4x2) { using WarpShape = cutlass::gemm::GemmShape<16, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1082,9 +1082,9 @@ TEST(SM50_device_maximum_plus_dsrgemm_tt_t, 64x64x8_16x32x1_4x4_4x8_4x2) { using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, 
SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1118,9 +1118,9 @@ TEST(SM50_device_maximum_plus_dsrgemm_tt_t, 128x32x8_32x16x1_4x4_8x4_4x2) { using WarpShape = cutlass::gemm::GemmShape<32, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1154,9 +1154,9 @@ TEST(SM50_device_maximum_plus_dsrgemm_tt_t, 32x64x16_8x16x1_2x2_4x8_4x4) { using WarpShape = cutlass::gemm::GemmShape<8, 16, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1190,9 +1190,9 @@ TEST(SM50_device_maximum_plus_dsrgemm_tt_t, 32x128x16_8x32x1_2x4_4x8_4x4) { using WarpShape = cutlass::gemm::GemmShape<8, 32, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< 
+ precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1226,9 +1226,9 @@ TEST(SM50_device_maximum_plus_dsrgemm_tt_t, 64x32x16_16x8x1_2x2_8x4_4x4) { using WarpShape = cutlass::gemm::GemmShape<16, 8, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1262,9 +1262,9 @@ TEST(SM50_device_maximum_plus_dsrgemm_tt_t, 64x64x8_16x16x1_4x2_4x8_4x4) { using WarpShape = cutlass::gemm::GemmShape<16, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1298,9 +1298,9 @@ TEST(SM50_device_maximum_plus_dsrgemm_tt_t, 128x32x16_32x8x1_4x2_8x4_4x4) { using WarpShape = cutlass::gemm::GemmShape<32, 8, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, 
SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; diff --git a/test/device/sm50_simt_maximum_plus_ssrgemm_nn_n.cu b/test/device/sm50_simt_maximum_plus_ssrgemm_nn_n.cu index 0289e86..634cc41 100644 --- a/test/device/sm50_simt_maximum_plus_ssrgemm_nn_n.cu +++ b/test/device/sm50_simt_maximum_plus_ssrgemm_nn_n.cu @@ -38,9 +38,9 @@ TEST(SM50_device_maximum_plus_ssrgemm_nn_n, 8x32x8_8x32x1_2x4_4x8_1x1) { using WarpShape = cutlass::gemm::GemmShape<8, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -74,9 +74,9 @@ TEST(SM50_device_maximum_plus_ssrgemm_nn_n, 16x32x8_16x32x1_4x4_4x8_1x1) { using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -110,9 +110,9 @@ TEST(SM50_device_maximum_plus_ssrgemm_nn_n, 16x64x8_16x64x1_4x8_4x8_1x1) { using WarpShape = cutlass::gemm::GemmShape<16, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + 
using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -146,9 +146,9 @@ TEST(SM50_device_maximum_plus_ssrgemm_nn_n, 32x32x8_32x32x1_8x4_4x8_1x1) { using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -182,9 +182,9 @@ TEST(SM50_device_maximum_plus_ssrgemm_nn_n, 32x64x8_32x64x1_8x8_4x8_1x1) { using WarpShape = cutlass::gemm::GemmShape<32, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -218,9 +218,9 @@ TEST(SM50_device_maximum_plus_ssrgemm_nn_n, 64x32x8_64x32x1_8x8_8x4_1x1) { using WarpShape = cutlass::gemm::GemmShape<64, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, 
precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -254,9 +254,9 @@ TEST(SM50_device_maximum_plus_ssrgemm_nn_n, 8x32x8_8x16x1_2x2_4x8_1x2) { using WarpShape = cutlass::gemm::GemmShape<8, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -290,9 +290,9 @@ TEST(SM50_device_maximum_plus_ssrgemm_nn_n, 8x64x8_8x32x1_2x4_4x8_1x2) { using WarpShape = cutlass::gemm::GemmShape<8, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -326,9 +326,9 @@ TEST(SM50_device_maximum_plus_ssrgemm_nn_n, 16x32x8_16x16x1_4x2_4x8_1x2) { using WarpShape = cutlass::gemm::GemmShape<16, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = 
Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -362,9 +362,9 @@ TEST(SM50_device_maximum_plus_ssrgemm_nn_n, 16x64x8_16x32x1_4x4_4x8_1x2) { using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -398,9 +398,9 @@ TEST(SM50_device_maximum_plus_ssrgemm_nn_n, 16x128x8_16x64x1_4x8_4x8_1x2) { using WarpShape = cutlass::gemm::GemmShape<16, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -434,9 +434,9 @@ TEST(SM50_device_maximum_plus_ssrgemm_nn_n, 32x32x8_32x16x1_4x4_8x4_1x2) { using WarpShape = cutlass::gemm::GemmShape<32, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -470,9 +470,9 @@ 
TEST(SM50_device_maximum_plus_ssrgemm_nn_n, 32x64x8_32x32x1_8x4_4x8_1x2) { using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -506,9 +506,9 @@ TEST(SM50_device_maximum_plus_ssrgemm_nn_n, 32x128x8_32x64x1_8x8_4x8_1x2) { using WarpShape = cutlass::gemm::GemmShape<32, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -542,9 +542,9 @@ TEST(SM50_device_maximum_plus_ssrgemm_nn_n, 64x64x8_64x32x1_8x8_8x4_1x2) { using WarpShape = cutlass::gemm::GemmShape<64, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -578,9 +578,9 @@ TEST(SM50_device_maximum_plus_ssrgemm_nn_n, 32x32x8_16x32x1_4x4_4x8_2x1) { using WarpShape = 
cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -614,9 +614,9 @@ TEST(SM50_device_maximum_plus_ssrgemm_nn_n, 64x32x8_32x32x1_8x4_4x8_2x1) { using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -650,9 +650,9 @@ TEST(SM50_device_maximum_plus_ssrgemm_nn_n, 64x64x8_32x64x1_8x8_4x8_2x1) { using WarpShape = cutlass::gemm::GemmShape<32, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -686,9 +686,9 @@ TEST(SM50_device_maximum_plus_ssrgemm_nn_n, 128x32x8_64x32x1_8x8_8x4_2x1) { using WarpShape = cutlass::gemm::GemmShape<64, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 
1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -722,9 +722,9 @@ TEST(SM50_device_maximum_plus_ssrgemm_nn_n, 16x32x8_8x16x1_2x2_4x8_2x2) { using WarpShape = cutlass::gemm::GemmShape<8, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -758,9 +758,9 @@ TEST(SM50_device_maximum_plus_ssrgemm_nn_n, 16x64x8_8x32x1_2x4_4x8_2x2) { using WarpShape = cutlass::gemm::GemmShape<8, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -794,9 +794,9 @@ TEST(SM50_device_maximum_plus_ssrgemm_nn_n, 32x32x8_16x16x1_4x2_4x8_2x2) { using WarpShape = cutlass::gemm::GemmShape<16, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, 
precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -830,9 +830,9 @@ TEST(SM50_device_maximum_plus_ssrgemm_nn_n, 32x64x8_16x32x1_4x4_4x8_2x2) { using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -866,9 +866,9 @@ TEST(SM50_device_maximum_plus_ssrgemm_nn_n, 32x128x8_16x64x1_4x8_4x8_2x2) { using WarpShape = cutlass::gemm::GemmShape<16, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -902,9 +902,9 @@ TEST(SM50_device_maximum_plus_ssrgemm_nn_n, 64x32x8_32x16x1_4x4_8x4_2x2) { using WarpShape = cutlass::gemm::GemmShape<32, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using 
Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -938,9 +938,9 @@ TEST(SM50_device_maximum_plus_ssrgemm_nn_n, 64x64x8_32x32x1_8x4_4x8_2x2) { using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -974,9 +974,9 @@ TEST(SM50_device_maximum_plus_ssrgemm_nn_n, 64x128x8_32x64x1_8x8_4x8_2x2) { using WarpShape = cutlass::gemm::GemmShape<32, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1010,9 +1010,9 @@ TEST(SM50_device_maximum_plus_ssrgemm_nn_n, 128x32x8_64x16x1_8x4_8x4_2x2) { using WarpShape = cutlass::gemm::GemmShape<64, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, 
precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1046,9 +1046,9 @@ TEST(SM50_device_maximum_plus_ssrgemm_nn_n, 128x64x8_64x32x1_8x8_8x4_2x2) { using WarpShape = cutlass::gemm::GemmShape<64, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1082,9 +1082,9 @@ TEST(SM50_device_maximum_plus_ssrgemm_nn_n, 16x64x16_8x16x1_2x2_4x8_2x4) { using WarpShape = cutlass::gemm::GemmShape<8, 16, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1118,9 +1118,9 @@ TEST(SM50_device_maximum_plus_ssrgemm_nn_n, 16x128x16_8x32x1_2x4_4x8_2x4) { using WarpShape = cutlass::gemm::GemmShape<8, 32, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; 
using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1154,9 +1154,9 @@ TEST(SM50_device_maximum_plus_ssrgemm_nn_n, 32x32x8_16x8x1_2x2_8x4_2x4) { using WarpShape = cutlass::gemm::GemmShape<16, 8, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1190,9 +1190,9 @@ TEST(SM50_device_maximum_plus_ssrgemm_nn_n, 32x64x8_16x16x1_4x2_4x8_2x4) { using WarpShape = cutlass::gemm::GemmShape<16, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1226,9 +1226,9 @@ TEST(SM50_device_maximum_plus_ssrgemm_nn_n, 32x128x8_16x32x1_4x4_4x8_2x4) { using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1262,9 
+1262,9 @@ TEST(SM50_device_maximum_plus_ssrgemm_nn_n, 32x256x8_16x64x1_4x8_4x8_2x4) { using WarpShape = cutlass::gemm::GemmShape<16, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1298,9 +1298,9 @@ TEST(SM50_device_maximum_plus_ssrgemm_nn_n, 64x64x8_32x16x1_4x4_8x4_2x4) { using WarpShape = cutlass::gemm::GemmShape<32, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1334,9 +1334,9 @@ TEST(SM50_device_maximum_plus_ssrgemm_nn_n, 64x128x8_32x32x1_8x4_4x8_2x4) { using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1370,9 +1370,9 @@ TEST(SM50_device_maximum_plus_ssrgemm_nn_n, 64x256x8_32x64x1_8x8_4x8_2x4) { 
using WarpShape = cutlass::gemm::GemmShape<32, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1406,9 +1406,9 @@ TEST(SM50_device_maximum_plus_ssrgemm_nn_n, 128x128x8_64x32x1_8x8_8x4_2x4) { using WarpShape = cutlass::gemm::GemmShape<64, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1442,9 +1442,9 @@ TEST(SM50_device_maximum_plus_ssrgemm_nn_n, 32x32x8_8x16x1_2x2_4x8_4x2) { using WarpShape = cutlass::gemm::GemmShape<8, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1478,9 +1478,9 @@ TEST(SM50_device_maximum_plus_ssrgemm_nn_n, 64x32x8_16x16x1_4x2_4x8_4x2) { using WarpShape = cutlass::gemm::GemmShape<16, 16, 8>; using InstructionShape = 
cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1514,9 +1514,9 @@ TEST(SM50_device_maximum_plus_ssrgemm_nn_n, 64x64x8_16x32x1_4x4_4x8_4x2) { using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1550,9 +1550,9 @@ TEST(SM50_device_maximum_plus_ssrgemm_nn_n, 128x32x8_32x16x1_4x4_8x4_4x2) { using WarpShape = cutlass::gemm::GemmShape<32, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1586,9 +1586,9 @@ TEST(SM50_device_maximum_plus_ssrgemm_nn_n, 128x64x8_32x32x1_8x4_4x8_4x2) { using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename 
cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1622,9 +1622,9 @@ TEST(SM50_device_maximum_plus_ssrgemm_nn_n, 128x128x8_32x64x1_8x8_4x8_4x2) { using WarpShape = cutlass::gemm::GemmShape<32, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1658,9 +1658,9 @@ TEST(SM50_device_maximum_plus_ssrgemm_nn_n, 256x32x8_64x16x1_8x4_8x4_4x2) { using WarpShape = cutlass::gemm::GemmShape<64, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1694,9 +1694,9 @@ TEST(SM50_device_maximum_plus_ssrgemm_nn_n, 256x64x8_64x32x1_8x8_8x4_4x2) { using WarpShape = cutlass::gemm::GemmShape<64, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, 
precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1730,9 +1730,9 @@ TEST(SM50_device_maximum_plus_ssrgemm_nn_n, 32x64x16_8x16x1_2x2_4x8_4x4) { using WarpShape = cutlass::gemm::GemmShape<8, 16, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1766,9 +1766,9 @@ TEST(SM50_device_maximum_plus_ssrgemm_nn_n, 32x128x16_8x32x1_2x4_4x8_4x4) { using WarpShape = cutlass::gemm::GemmShape<8, 32, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1802,9 +1802,9 @@ TEST(SM50_device_maximum_plus_ssrgemm_nn_n, 64x32x16_16x8x1_2x2_8x4_4x4) { using WarpShape = cutlass::gemm::GemmShape<16, 8, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using 
Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1838,9 +1838,9 @@ TEST(SM50_device_maximum_plus_ssrgemm_nn_n, 64x64x8_16x16x1_4x2_4x8_4x4) { using WarpShape = cutlass::gemm::GemmShape<16, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1874,9 +1874,9 @@ TEST(SM50_device_maximum_plus_ssrgemm_nn_n, 64x128x8_16x32x1_4x4_4x8_4x4) { using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1910,9 +1910,9 @@ TEST(SM50_device_maximum_plus_ssrgemm_nn_n, 64x256x8_16x64x1_4x8_4x8_4x4) { using WarpShape = cutlass::gemm::GemmShape<16, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, 
precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1946,9 +1946,9 @@ TEST(SM50_device_maximum_plus_ssrgemm_nn_n, 128x32x16_32x8x1_4x2_8x4_4x4) { using WarpShape = cutlass::gemm::GemmShape<32, 8, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1982,9 +1982,9 @@ TEST(SM50_device_maximum_plus_ssrgemm_nn_n, 128x64x8_32x16x1_4x4_8x4_4x4) { using WarpShape = cutlass::gemm::GemmShape<32, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -2018,9 +2018,9 @@ TEST(SM50_device_maximum_plus_ssrgemm_nn_n, 128x128x8_32x32x1_8x4_4x8_4x4) { using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; 
using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -2054,9 +2054,9 @@ TEST(SM50_device_maximum_plus_ssrgemm_nn_n, 256x64x8_64x16x1_8x4_8x4_4x4) { using WarpShape = cutlass::gemm::GemmShape<64, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; diff --git a/test/device/sm50_simt_maximum_plus_ssrgemm_nn_t.cu b/test/device/sm50_simt_maximum_plus_ssrgemm_nn_t.cu index 04d5adc..e556bb2 100644 --- a/test/device/sm50_simt_maximum_plus_ssrgemm_nn_t.cu +++ b/test/device/sm50_simt_maximum_plus_ssrgemm_nn_t.cu @@ -38,9 +38,9 @@ TEST(SM50_device_maximum_plus_ssrgemm_nn_t, 8x32x8_8x32x1_2x4_4x8_1x1) { using WarpShape = cutlass::gemm::GemmShape<8, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -74,9 +74,9 @@ TEST(SM50_device_maximum_plus_ssrgemm_nn_t, 16x32x8_16x32x1_4x4_4x8_1x1) { using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using 
Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -110,9 +110,9 @@ TEST(SM50_device_maximum_plus_ssrgemm_nn_t, 16x64x8_16x64x1_4x8_4x8_1x1) { using WarpShape = cutlass::gemm::GemmShape<16, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -146,9 +146,9 @@ TEST(SM50_device_maximum_plus_ssrgemm_nn_t, 32x32x8_32x32x1_8x4_4x8_1x1) { using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -182,9 +182,9 @@ TEST(SM50_device_maximum_plus_ssrgemm_nn_t, 32x64x8_32x64x1_8x8_4x8_1x1) { using WarpShape = cutlass::gemm::GemmShape<32, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, 
precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -218,9 +218,9 @@ TEST(SM50_device_maximum_plus_ssrgemm_nn_t, 64x32x8_64x32x1_8x8_8x4_1x1) { using WarpShape = cutlass::gemm::GemmShape<64, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -254,9 +254,9 @@ TEST(SM50_device_maximum_plus_ssrgemm_nn_t, 8x32x8_8x16x1_2x2_4x8_1x2) { using WarpShape = cutlass::gemm::GemmShape<8, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -290,9 +290,9 @@ TEST(SM50_device_maximum_plus_ssrgemm_nn_t, 8x64x8_8x32x1_2x4_4x8_1x2) { using WarpShape = cutlass::gemm::GemmShape<8, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = 
Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -326,9 +326,9 @@ TEST(SM50_device_maximum_plus_ssrgemm_nn_t, 16x32x8_16x16x1_4x2_4x8_1x2) { using WarpShape = cutlass::gemm::GemmShape<16, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -362,9 +362,9 @@ TEST(SM50_device_maximum_plus_ssrgemm_nn_t, 16x64x8_16x32x1_4x4_4x8_1x2) { using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -398,9 +398,9 @@ TEST(SM50_device_maximum_plus_ssrgemm_nn_t, 16x128x8_16x64x1_4x8_4x8_1x2) { using WarpShape = cutlass::gemm::GemmShape<16, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -434,9 +434,9 @@ 
TEST(SM50_device_maximum_plus_ssrgemm_nn_t, 32x32x8_32x16x1_4x4_8x4_1x2) { using WarpShape = cutlass::gemm::GemmShape<32, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -470,9 +470,9 @@ TEST(SM50_device_maximum_plus_ssrgemm_nn_t, 32x64x8_32x32x1_8x4_4x8_1x2) { using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -506,9 +506,9 @@ TEST(SM50_device_maximum_plus_ssrgemm_nn_t, 32x128x8_32x64x1_8x8_4x8_1x2) { using WarpShape = cutlass::gemm::GemmShape<32, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -542,9 +542,9 @@ TEST(SM50_device_maximum_plus_ssrgemm_nn_t, 64x64x8_64x32x1_8x8_8x4_1x2) { using WarpShape = 
cutlass::gemm::GemmShape<64, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -578,9 +578,9 @@ TEST(SM50_device_maximum_plus_ssrgemm_nn_t, 32x32x8_16x32x1_4x4_4x8_2x1) { using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -614,9 +614,9 @@ TEST(SM50_device_maximum_plus_ssrgemm_nn_t, 64x32x8_32x32x1_8x4_4x8_2x1) { using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -650,9 +650,9 @@ TEST(SM50_device_maximum_plus_ssrgemm_nn_t, 64x64x8_32x64x1_8x8_4x8_2x1) { using WarpShape = cutlass::gemm::GemmShape<32, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 
1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -686,9 +686,9 @@ TEST(SM50_device_maximum_plus_ssrgemm_nn_t, 128x32x8_64x32x1_8x8_8x4_2x1) { using WarpShape = cutlass::gemm::GemmShape<64, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -722,9 +722,9 @@ TEST(SM50_device_maximum_plus_ssrgemm_nn_t, 16x32x8_8x16x1_2x2_4x8_2x2) { using WarpShape = cutlass::gemm::GemmShape<8, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -758,9 +758,9 @@ TEST(SM50_device_maximum_plus_ssrgemm_nn_t, 16x64x8_8x32x1_2x4_4x8_2x2) { using WarpShape = cutlass::gemm::GemmShape<8, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, 
precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -794,9 +794,9 @@ TEST(SM50_device_maximum_plus_ssrgemm_nn_t, 32x32x8_16x16x1_4x2_4x8_2x2) { using WarpShape = cutlass::gemm::GemmShape<16, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -830,9 +830,9 @@ TEST(SM50_device_maximum_plus_ssrgemm_nn_t, 32x64x8_16x32x1_4x4_4x8_2x2) { using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -866,9 +866,9 @@ TEST(SM50_device_maximum_plus_ssrgemm_nn_t, 32x128x8_16x64x1_4x8_4x8_2x2) { using WarpShape = cutlass::gemm::GemmShape<16, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using 
Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -902,9 +902,9 @@ TEST(SM50_device_maximum_plus_ssrgemm_nn_t, 64x32x8_32x16x1_4x4_8x4_2x2) { using WarpShape = cutlass::gemm::GemmShape<32, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -938,9 +938,9 @@ TEST(SM50_device_maximum_plus_ssrgemm_nn_t, 64x64x8_32x32x1_8x4_4x8_2x2) { using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -974,9 +974,9 @@ TEST(SM50_device_maximum_plus_ssrgemm_nn_t, 64x128x8_32x64x1_8x8_4x8_2x2) { using WarpShape = cutlass::gemm::GemmShape<32, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, 
precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1010,9 +1010,9 @@ TEST(SM50_device_maximum_plus_ssrgemm_nn_t, 128x32x8_64x16x1_8x4_8x4_2x2) { using WarpShape = cutlass::gemm::GemmShape<64, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1046,9 +1046,9 @@ TEST(SM50_device_maximum_plus_ssrgemm_nn_t, 128x64x8_64x32x1_8x8_8x4_2x2) { using WarpShape = cutlass::gemm::GemmShape<64, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1082,9 +1082,9 @@ TEST(SM50_device_maximum_plus_ssrgemm_nn_t, 16x64x16_8x16x1_2x2_4x8_2x4) { using WarpShape = cutlass::gemm::GemmShape<8, 16, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = 
Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1118,9 +1118,9 @@ TEST(SM50_device_maximum_plus_ssrgemm_nn_t, 16x128x16_8x32x1_2x4_4x8_2x4) { using WarpShape = cutlass::gemm::GemmShape<8, 32, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1154,9 +1154,9 @@ TEST(SM50_device_maximum_plus_ssrgemm_nn_t, 32x32x8_16x8x1_2x2_8x4_2x4) { using WarpShape = cutlass::gemm::GemmShape<16, 8, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1190,9 +1190,9 @@ TEST(SM50_device_maximum_plus_ssrgemm_nn_t, 32x64x8_16x16x1_4x2_4x8_2x4) { using WarpShape = cutlass::gemm::GemmShape<16, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1226,9 +1226,9 @@ 
TEST(SM50_device_maximum_plus_ssrgemm_nn_t, 32x128x8_16x32x1_4x4_4x8_2x4) { using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1262,9 +1262,9 @@ TEST(SM50_device_maximum_plus_ssrgemm_nn_t, 32x256x8_16x64x1_4x8_4x8_2x4) { using WarpShape = cutlass::gemm::GemmShape<16, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1298,9 +1298,9 @@ TEST(SM50_device_maximum_plus_ssrgemm_nn_t, 64x64x8_32x16x1_4x4_8x4_2x4) { using WarpShape = cutlass::gemm::GemmShape<32, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1334,9 +1334,9 @@ TEST(SM50_device_maximum_plus_ssrgemm_nn_t, 64x128x8_32x32x1_8x4_4x8_2x4) { using 
WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1370,9 +1370,9 @@ TEST(SM50_device_maximum_plus_ssrgemm_nn_t, 64x256x8_32x64x1_8x8_4x8_2x4) { using WarpShape = cutlass::gemm::GemmShape<32, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1406,9 +1406,9 @@ TEST(SM50_device_maximum_plus_ssrgemm_nn_t, 128x128x8_64x32x1_8x8_8x4_2x4) { using WarpShape = cutlass::gemm::GemmShape<64, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1442,9 +1442,9 @@ TEST(SM50_device_maximum_plus_ssrgemm_nn_t, 32x32x8_8x16x1_2x2_4x8_4x2) { using WarpShape = cutlass::gemm::GemmShape<8, 16, 8>; using InstructionShape = 
cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1478,9 +1478,9 @@ TEST(SM50_device_maximum_plus_ssrgemm_nn_t, 64x32x8_16x16x1_4x2_4x8_4x2) { using WarpShape = cutlass::gemm::GemmShape<16, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1514,9 +1514,9 @@ TEST(SM50_device_maximum_plus_ssrgemm_nn_t, 64x64x8_16x32x1_4x4_4x8_4x2) { using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1550,9 +1550,9 @@ TEST(SM50_device_maximum_plus_ssrgemm_nn_t, 128x32x8_32x16x1_4x4_8x4_4x2) { using WarpShape = cutlass::gemm::GemmShape<32, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename 
cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1586,9 +1586,9 @@ TEST(SM50_device_maximum_plus_ssrgemm_nn_t, 128x64x8_32x32x1_8x4_4x8_4x2) { using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1622,9 +1622,9 @@ TEST(SM50_device_maximum_plus_ssrgemm_nn_t, 128x128x8_32x64x1_8x8_4x8_4x2) { using WarpShape = cutlass::gemm::GemmShape<32, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1658,9 +1658,9 @@ TEST(SM50_device_maximum_plus_ssrgemm_nn_t, 256x32x8_64x16x1_8x4_8x4_4x2) { using WarpShape = cutlass::gemm::GemmShape<64, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, 
precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1694,9 +1694,9 @@ TEST(SM50_device_maximum_plus_ssrgemm_nn_t, 256x64x8_64x32x1_8x8_8x4_4x2) { using WarpShape = cutlass::gemm::GemmShape<64, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1730,9 +1730,9 @@ TEST(SM50_device_maximum_plus_ssrgemm_nn_t, 32x64x16_8x16x1_2x2_4x8_4x4) { using WarpShape = cutlass::gemm::GemmShape<8, 16, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1766,9 +1766,9 @@ TEST(SM50_device_maximum_plus_ssrgemm_nn_t, 32x128x16_8x32x1_2x4_4x8_4x4) { using WarpShape = cutlass::gemm::GemmShape<8, 32, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using 
Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1802,9 +1802,9 @@ TEST(SM50_device_maximum_plus_ssrgemm_nn_t, 64x32x16_16x8x1_2x2_8x4_4x4) { using WarpShape = cutlass::gemm::GemmShape<16, 8, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1838,9 +1838,9 @@ TEST(SM50_device_maximum_plus_ssrgemm_nn_t, 64x64x8_16x16x1_4x2_4x8_4x4) { using WarpShape = cutlass::gemm::GemmShape<16, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1874,9 +1874,9 @@ TEST(SM50_device_maximum_plus_ssrgemm_nn_t, 64x128x8_16x32x1_4x4_4x8_4x4) { using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, 
precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1910,9 +1910,9 @@ TEST(SM50_device_maximum_plus_ssrgemm_nn_t, 64x256x8_16x64x1_4x8_4x8_4x4) { using WarpShape = cutlass::gemm::GemmShape<16, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1946,9 +1946,9 @@ TEST(SM50_device_maximum_plus_ssrgemm_nn_t, 128x32x16_32x8x1_4x2_8x4_4x4) { using WarpShape = cutlass::gemm::GemmShape<32, 8, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1982,9 +1982,9 @@ TEST(SM50_device_maximum_plus_ssrgemm_nn_t, 128x64x8_32x16x1_4x4_8x4_4x4) { using WarpShape = cutlass::gemm::GemmShape<32, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; 
using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -2018,9 +2018,9 @@ TEST(SM50_device_maximum_plus_ssrgemm_nn_t, 128x128x8_32x32x1_8x4_4x8_4x4) { using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -2054,9 +2054,9 @@ TEST(SM50_device_maximum_plus_ssrgemm_nn_t, 256x64x8_64x16x1_8x4_8x4_4x4) { using WarpShape = cutlass::gemm::GemmShape<64, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; diff --git a/test/device/sm50_simt_maximum_plus_ssrgemm_nt_n.cu b/test/device/sm50_simt_maximum_plus_ssrgemm_nt_n.cu index b49dd8c..b4e72d1 100644 --- a/test/device/sm50_simt_maximum_plus_ssrgemm_nt_n.cu +++ b/test/device/sm50_simt_maximum_plus_ssrgemm_nt_n.cu @@ -38,9 +38,9 @@ TEST(SM50_device_maximum_plus_ssrgemm_nt_n, 8x32x8_8x32x1_2x4_4x8_1x1) { using WarpShape = cutlass::gemm::GemmShape<8, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + 
using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -74,9 +74,9 @@ TEST(SM50_device_maximum_plus_ssrgemm_nt_n, 16x32x8_16x32x1_4x4_4x8_1x1) { using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -110,9 +110,9 @@ TEST(SM50_device_maximum_plus_ssrgemm_nt_n, 16x64x8_16x64x1_4x8_4x8_1x1) { using WarpShape = cutlass::gemm::GemmShape<16, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -146,9 +146,9 @@ TEST(SM50_device_maximum_plus_ssrgemm_nt_n, 32x32x8_32x32x1_8x4_4x8_1x1) { using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, 
precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -182,9 +182,9 @@ TEST(SM50_device_maximum_plus_ssrgemm_nt_n, 32x64x8_32x64x1_8x8_4x8_1x1) { using WarpShape = cutlass::gemm::GemmShape<32, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -218,9 +218,9 @@ TEST(SM50_device_maximum_plus_ssrgemm_nt_n, 64x32x8_64x32x1_8x8_8x4_1x1) { using WarpShape = cutlass::gemm::GemmShape<64, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -254,9 +254,9 @@ TEST(SM50_device_maximum_plus_ssrgemm_nt_n, 8x32x8_8x16x1_2x2_4x8_1x2) { using WarpShape = cutlass::gemm::GemmShape<8, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = 
Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -290,9 +290,9 @@ TEST(SM50_device_maximum_plus_ssrgemm_nt_n, 8x64x8_8x32x1_2x4_4x8_1x2) { using WarpShape = cutlass::gemm::GemmShape<8, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -326,9 +326,9 @@ TEST(SM50_device_maximum_plus_ssrgemm_nt_n, 16x32x8_16x16x1_4x2_4x8_1x2) { using WarpShape = cutlass::gemm::GemmShape<16, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -362,9 +362,9 @@ TEST(SM50_device_maximum_plus_ssrgemm_nt_n, 16x64x8_16x32x1_4x4_4x8_1x2) { using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -398,9 +398,9 @@ 
TEST(SM50_device_maximum_plus_ssrgemm_nt_n, 16x128x8_16x64x1_4x8_4x8_1x2) { using WarpShape = cutlass::gemm::GemmShape<16, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -434,9 +434,9 @@ TEST(SM50_device_maximum_plus_ssrgemm_nt_n, 32x32x8_32x16x1_4x4_8x4_1x2) { using WarpShape = cutlass::gemm::GemmShape<32, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -470,9 +470,9 @@ TEST(SM50_device_maximum_plus_ssrgemm_nt_n, 32x64x8_32x32x1_8x4_4x8_1x2) { using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -506,9 +506,9 @@ TEST(SM50_device_maximum_plus_ssrgemm_nt_n, 32x128x8_32x64x1_8x8_4x8_1x2) { using WarpShape = 
cutlass::gemm::GemmShape<32, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -542,9 +542,9 @@ TEST(SM50_device_maximum_plus_ssrgemm_nt_n, 64x64x8_64x32x1_8x8_8x4_1x2) { using WarpShape = cutlass::gemm::GemmShape<64, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -578,9 +578,9 @@ TEST(SM50_device_maximum_plus_ssrgemm_nt_n, 32x32x8_16x32x1_4x4_4x8_2x1) { using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -614,9 +614,9 @@ TEST(SM50_device_maximum_plus_ssrgemm_nt_n, 64x32x8_32x32x1_8x4_4x8_2x1) { using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 
1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -650,9 +650,9 @@ TEST(SM50_device_maximum_plus_ssrgemm_nt_n, 64x64x8_32x64x1_8x8_4x8_2x1) { using WarpShape = cutlass::gemm::GemmShape<32, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -686,9 +686,9 @@ TEST(SM50_device_maximum_plus_ssrgemm_nt_n, 128x32x8_64x32x1_8x8_8x4_2x1) { using WarpShape = cutlass::gemm::GemmShape<64, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -722,9 +722,9 @@ TEST(SM50_device_maximum_plus_ssrgemm_nt_n, 16x32x8_8x16x1_2x2_4x8_2x2) { using WarpShape = cutlass::gemm::GemmShape<8, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - 
precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -758,9 +758,9 @@ TEST(SM50_device_maximum_plus_ssrgemm_nt_n, 16x64x8_8x32x1_2x4_4x8_2x2) { using WarpShape = cutlass::gemm::GemmShape<8, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -794,9 +794,9 @@ TEST(SM50_device_maximum_plus_ssrgemm_nt_n, 32x32x8_16x16x1_4x2_4x8_2x2) { using WarpShape = cutlass::gemm::GemmShape<16, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -830,9 +830,9 @@ TEST(SM50_device_maximum_plus_ssrgemm_nt_n, 32x64x8_16x32x1_4x4_4x8_2x2) { using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; 
+ using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -866,9 +866,9 @@ TEST(SM50_device_maximum_plus_ssrgemm_nt_n, 32x128x8_16x64x1_4x8_4x8_2x2) { using WarpShape = cutlass::gemm::GemmShape<16, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -902,9 +902,9 @@ TEST(SM50_device_maximum_plus_ssrgemm_nt_n, 64x32x8_32x16x1_4x4_8x4_2x2) { using WarpShape = cutlass::gemm::GemmShape<32, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -938,9 +938,9 @@ TEST(SM50_device_maximum_plus_ssrgemm_nt_n, 64x64x8_32x32x1_8x4_4x8_2x2) { using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, 
precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -974,9 +974,9 @@ TEST(SM50_device_maximum_plus_ssrgemm_nt_n, 64x128x8_32x64x1_8x8_4x8_2x2) { using WarpShape = cutlass::gemm::GemmShape<32, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1010,9 +1010,9 @@ TEST(SM50_device_maximum_plus_ssrgemm_nt_n, 128x32x8_64x16x1_8x4_8x4_2x2) { using WarpShape = cutlass::gemm::GemmShape<64, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1046,9 +1046,9 @@ TEST(SM50_device_maximum_plus_ssrgemm_nt_n, 128x64x8_64x32x1_8x8_8x4_2x2) { using WarpShape = cutlass::gemm::GemmShape<64, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using 
AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1082,9 +1082,9 @@ TEST(SM50_device_maximum_plus_ssrgemm_nt_n, 16x64x16_8x16x1_2x2_4x8_2x4) { using WarpShape = cutlass::gemm::GemmShape<8, 16, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1118,9 +1118,9 @@ TEST(SM50_device_maximum_plus_ssrgemm_nt_n, 16x128x16_8x32x1_2x4_4x8_2x4) { using WarpShape = cutlass::gemm::GemmShape<8, 32, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1154,9 +1154,9 @@ TEST(SM50_device_maximum_plus_ssrgemm_nt_n, 32x32x8_16x8x1_2x2_8x4_2x4) { using WarpShape = cutlass::gemm::GemmShape<16, 8, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1190,9 +1190,9 
@@ TEST(SM50_device_maximum_plus_ssrgemm_nt_n, 32x64x8_16x16x1_4x2_4x8_2x4) { using WarpShape = cutlass::gemm::GemmShape<16, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1226,9 +1226,9 @@ TEST(SM50_device_maximum_plus_ssrgemm_nt_n, 32x128x8_16x32x1_4x4_4x8_2x4) { using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1262,9 +1262,9 @@ TEST(SM50_device_maximum_plus_ssrgemm_nt_n, 32x256x8_16x64x1_4x8_4x8_2x4) { using WarpShape = cutlass::gemm::GemmShape<16, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1298,9 +1298,9 @@ TEST(SM50_device_maximum_plus_ssrgemm_nt_n, 64x64x8_32x16x1_4x4_8x4_2x4) { using 
WarpShape = cutlass::gemm::GemmShape<32, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1334,9 +1334,9 @@ TEST(SM50_device_maximum_plus_ssrgemm_nt_n, 64x128x8_32x32x1_8x4_4x8_2x4) { using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1370,9 +1370,9 @@ TEST(SM50_device_maximum_plus_ssrgemm_nt_n, 64x256x8_32x64x1_8x8_4x8_2x4) { using WarpShape = cutlass::gemm::GemmShape<32, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1406,9 +1406,9 @@ TEST(SM50_device_maximum_plus_ssrgemm_nt_n, 128x128x8_64x32x1_8x8_8x4_2x4) { using WarpShape = cutlass::gemm::GemmShape<64, 32, 8>; using InstructionShape = 
cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1442,9 +1442,9 @@ TEST(SM50_device_maximum_plus_ssrgemm_nt_n, 32x32x8_8x16x1_2x2_4x8_4x2) { using WarpShape = cutlass::gemm::GemmShape<8, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1478,9 +1478,9 @@ TEST(SM50_device_maximum_plus_ssrgemm_nt_n, 64x32x8_16x16x1_4x2_4x8_4x2) { using WarpShape = cutlass::gemm::GemmShape<16, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1514,9 +1514,9 @@ TEST(SM50_device_maximum_plus_ssrgemm_nt_n, 64x64x8_16x32x1_4x4_4x8_4x2) { using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename 
cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1550,9 +1550,9 @@ TEST(SM50_device_maximum_plus_ssrgemm_nt_n, 128x32x8_32x16x1_4x4_8x4_4x2) { using WarpShape = cutlass::gemm::GemmShape<32, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1586,9 +1586,9 @@ TEST(SM50_device_maximum_plus_ssrgemm_nt_n, 128x64x8_32x32x1_8x4_4x8_4x2) { using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1622,9 +1622,9 @@ TEST(SM50_device_maximum_plus_ssrgemm_nt_n, 128x128x8_32x64x1_8x8_4x8_4x2) { using WarpShape = cutlass::gemm::GemmShape<32, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, 
precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1658,9 +1658,9 @@ TEST(SM50_device_maximum_plus_ssrgemm_nt_n, 256x32x8_64x16x1_8x4_8x4_4x2) { using WarpShape = cutlass::gemm::GemmShape<64, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1694,9 +1694,9 @@ TEST(SM50_device_maximum_plus_ssrgemm_nt_n, 256x64x8_64x32x1_8x8_8x4_4x2) { using WarpShape = cutlass::gemm::GemmShape<64, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1730,9 +1730,9 @@ TEST(SM50_device_maximum_plus_ssrgemm_nt_n, 32x64x16_8x16x1_2x2_4x8_4x4) { using WarpShape = cutlass::gemm::GemmShape<8, 16, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using 
Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1766,9 +1766,9 @@ TEST(SM50_device_maximum_plus_ssrgemm_nt_n, 32x128x16_8x32x1_2x4_4x8_4x4) { using WarpShape = cutlass::gemm::GemmShape<8, 32, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1802,9 +1802,9 @@ TEST(SM50_device_maximum_plus_ssrgemm_nt_n, 64x32x16_16x8x1_2x2_8x4_4x4) { using WarpShape = cutlass::gemm::GemmShape<16, 8, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1838,9 +1838,9 @@ TEST(SM50_device_maximum_plus_ssrgemm_nt_n, 64x64x8_16x16x1_4x2_4x8_4x4) { using WarpShape = cutlass::gemm::GemmShape<16, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, 
precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1874,9 +1874,9 @@ TEST(SM50_device_maximum_plus_ssrgemm_nt_n, 64x128x8_16x32x1_4x4_4x8_4x4) { using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1910,9 +1910,9 @@ TEST(SM50_device_maximum_plus_ssrgemm_nt_n, 64x256x8_16x64x1_4x8_4x8_4x4) { using WarpShape = cutlass::gemm::GemmShape<16, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1946,9 +1946,9 @@ TEST(SM50_device_maximum_plus_ssrgemm_nt_n, 128x32x16_32x8x1_4x2_8x4_4x4) { using WarpShape = cutlass::gemm::GemmShape<32, 8, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; 
using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1982,9 +1982,9 @@ TEST(SM50_device_maximum_plus_ssrgemm_nt_n, 128x64x8_32x16x1_4x4_8x4_4x4) { using WarpShape = cutlass::gemm::GemmShape<32, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -2018,9 +2018,9 @@ TEST(SM50_device_maximum_plus_ssrgemm_nt_n, 128x128x8_32x32x1_8x4_4x8_4x4) { using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -2054,9 +2054,9 @@ TEST(SM50_device_maximum_plus_ssrgemm_nt_n, 256x64x8_64x16x1_8x4_8x4_4x4) { using WarpShape = cutlass::gemm::GemmShape<64, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; diff 
--git a/test/device/sm50_simt_maximum_plus_ssrgemm_nt_t.cu b/test/device/sm50_simt_maximum_plus_ssrgemm_nt_t.cu index b0110d6..e482a7c 100644 --- a/test/device/sm50_simt_maximum_plus_ssrgemm_nt_t.cu +++ b/test/device/sm50_simt_maximum_plus_ssrgemm_nt_t.cu @@ -38,9 +38,9 @@ TEST(SM50_device_maximum_plus_ssrgemm_nt_t, 8x32x8_8x32x1_2x4_4x8_1x1) { using WarpShape = cutlass::gemm::GemmShape<8, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -74,9 +74,9 @@ TEST(SM50_device_maximum_plus_ssrgemm_nt_t, 16x32x8_16x32x1_4x4_4x8_1x1) { using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -110,9 +110,9 @@ TEST(SM50_device_maximum_plus_ssrgemm_nt_t, 16x64x8_16x64x1_4x8_4x8_1x1) { using WarpShape = cutlass::gemm::GemmShape<16, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, 
precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -146,9 +146,9 @@ TEST(SM50_device_maximum_plus_ssrgemm_nt_t, 32x32x8_32x32x1_8x4_4x8_1x1) { using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -182,9 +182,9 @@ TEST(SM50_device_maximum_plus_ssrgemm_nt_t, 32x64x8_32x64x1_8x8_4x8_1x1) { using WarpShape = cutlass::gemm::GemmShape<32, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -218,9 +218,9 @@ TEST(SM50_device_maximum_plus_ssrgemm_nt_t, 64x32x8_64x32x1_8x8_8x4_1x1) { using WarpShape = cutlass::gemm::GemmShape<64, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp 
= Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -254,9 +254,9 @@ TEST(SM50_device_maximum_plus_ssrgemm_nt_t, 8x32x8_8x16x1_2x2_4x8_1x2) { using WarpShape = cutlass::gemm::GemmShape<8, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -290,9 +290,9 @@ TEST(SM50_device_maximum_plus_ssrgemm_nt_t, 8x64x8_8x32x1_2x4_4x8_1x2) { using WarpShape = cutlass::gemm::GemmShape<8, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -326,9 +326,9 @@ TEST(SM50_device_maximum_plus_ssrgemm_nt_t, 16x32x8_16x16x1_4x2_4x8_1x2) { using WarpShape = cutlass::gemm::GemmShape<16, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -362,9 +362,9 @@ 
TEST(SM50_device_maximum_plus_ssrgemm_nt_t, 16x64x8_16x32x1_4x4_4x8_1x2) { using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -398,9 +398,9 @@ TEST(SM50_device_maximum_plus_ssrgemm_nt_t, 16x128x8_16x64x1_4x8_4x8_1x2) { using WarpShape = cutlass::gemm::GemmShape<16, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -434,9 +434,9 @@ TEST(SM50_device_maximum_plus_ssrgemm_nt_t, 32x32x8_32x16x1_4x4_8x4_1x2) { using WarpShape = cutlass::gemm::GemmShape<32, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -470,9 +470,9 @@ TEST(SM50_device_maximum_plus_ssrgemm_nt_t, 32x64x8_32x32x1_8x4_4x8_1x2) { using WarpShape = 
cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -506,9 +506,9 @@ TEST(SM50_device_maximum_plus_ssrgemm_nt_t, 32x128x8_32x64x1_8x8_4x8_1x2) { using WarpShape = cutlass::gemm::GemmShape<32, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -542,9 +542,9 @@ TEST(SM50_device_maximum_plus_ssrgemm_nt_t, 64x64x8_64x32x1_8x8_8x4_1x2) { using WarpShape = cutlass::gemm::GemmShape<64, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -578,9 +578,9 @@ TEST(SM50_device_maximum_plus_ssrgemm_nt_t, 32x32x8_16x32x1_4x4_4x8_2x1) { using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 
1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -614,9 +614,9 @@ TEST(SM50_device_maximum_plus_ssrgemm_nt_t, 64x32x8_32x32x1_8x4_4x8_2x1) { using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -650,9 +650,9 @@ TEST(SM50_device_maximum_plus_ssrgemm_nt_t, 64x64x8_32x64x1_8x8_4x8_2x1) { using WarpShape = cutlass::gemm::GemmShape<32, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -686,9 +686,9 @@ TEST(SM50_device_maximum_plus_ssrgemm_nt_t, 128x32x8_64x32x1_8x8_8x4_2x1) { using WarpShape = cutlass::gemm::GemmShape<64, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - 
precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -722,9 +722,9 @@ TEST(SM50_device_maximum_plus_ssrgemm_nt_t, 16x32x8_8x16x1_2x2_4x8_2x2) { using WarpShape = cutlass::gemm::GemmShape<8, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -758,9 +758,9 @@ TEST(SM50_device_maximum_plus_ssrgemm_nt_t, 16x64x8_8x32x1_2x4_4x8_2x2) { using WarpShape = cutlass::gemm::GemmShape<8, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -794,9 +794,9 @@ TEST(SM50_device_maximum_plus_ssrgemm_nt_t, 32x32x8_16x16x1_4x2_4x8_2x2) { using WarpShape = cutlass::gemm::GemmShape<16, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + 
using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -830,9 +830,9 @@ TEST(SM50_device_maximum_plus_ssrgemm_nt_t, 32x64x8_16x32x1_4x4_4x8_2x2) { using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -866,9 +866,9 @@ TEST(SM50_device_maximum_plus_ssrgemm_nt_t, 32x128x8_16x64x1_4x8_4x8_2x2) { using WarpShape = cutlass::gemm::GemmShape<16, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -902,9 +902,9 @@ TEST(SM50_device_maximum_plus_ssrgemm_nt_t, 64x32x8_32x16x1_4x4_8x4_2x2) { using WarpShape = cutlass::gemm::GemmShape<32, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, 
precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -938,9 +938,9 @@ TEST(SM50_device_maximum_plus_ssrgemm_nt_t, 64x64x8_32x32x1_8x4_4x8_2x2) { using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -974,9 +974,9 @@ TEST(SM50_device_maximum_plus_ssrgemm_nt_t, 64x128x8_32x64x1_8x8_4x8_2x2) { using WarpShape = cutlass::gemm::GemmShape<32, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1010,9 +1010,9 @@ TEST(SM50_device_maximum_plus_ssrgemm_nt_t, 128x32x8_64x16x1_8x4_8x4_2x2) { using WarpShape = cutlass::gemm::GemmShape<64, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using 
AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1046,9 +1046,9 @@ TEST(SM50_device_maximum_plus_ssrgemm_nt_t, 128x64x8_64x32x1_8x8_8x4_2x2) { using WarpShape = cutlass::gemm::GemmShape<64, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1082,9 +1082,9 @@ TEST(SM50_device_maximum_plus_ssrgemm_nt_t, 16x64x16_8x16x1_2x2_4x8_2x4) { using WarpShape = cutlass::gemm::GemmShape<8, 16, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1118,9 +1118,9 @@ TEST(SM50_device_maximum_plus_ssrgemm_nt_t, 16x128x16_8x32x1_2x4_4x8_2x4) { using WarpShape = cutlass::gemm::GemmShape<8, 32, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1154,9 
+1154,9 @@ TEST(SM50_device_maximum_plus_ssrgemm_nt_t, 32x32x8_16x8x1_2x2_8x4_2x4) { using WarpShape = cutlass::gemm::GemmShape<16, 8, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1190,9 +1190,9 @@ TEST(SM50_device_maximum_plus_ssrgemm_nt_t, 32x64x8_16x16x1_4x2_4x8_2x4) { using WarpShape = cutlass::gemm::GemmShape<16, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1226,9 +1226,9 @@ TEST(SM50_device_maximum_plus_ssrgemm_nt_t, 32x128x8_16x32x1_4x4_4x8_2x4) { using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1262,9 +1262,9 @@ TEST(SM50_device_maximum_plus_ssrgemm_nt_t, 32x256x8_16x64x1_4x8_4x8_2x4) { 
using WarpShape = cutlass::gemm::GemmShape<16, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1298,9 +1298,9 @@ TEST(SM50_device_maximum_plus_ssrgemm_nt_t, 64x64x8_32x16x1_4x4_8x4_2x4) { using WarpShape = cutlass::gemm::GemmShape<32, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1334,9 +1334,9 @@ TEST(SM50_device_maximum_plus_ssrgemm_nt_t, 64x128x8_32x32x1_8x4_4x8_2x4) { using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1370,9 +1370,9 @@ TEST(SM50_device_maximum_plus_ssrgemm_nt_t, 64x256x8_32x64x1_8x8_4x8_2x4) { using WarpShape = cutlass::gemm::GemmShape<32, 64, 8>; using InstructionShape = 
cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1406,9 +1406,9 @@ TEST(SM50_device_maximum_plus_ssrgemm_nt_t, 128x128x8_64x32x1_8x8_8x4_2x4) { using WarpShape = cutlass::gemm::GemmShape<64, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1442,9 +1442,9 @@ TEST(SM50_device_maximum_plus_ssrgemm_nt_t, 32x32x8_8x16x1_2x2_4x8_4x2) { using WarpShape = cutlass::gemm::GemmShape<8, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1478,9 +1478,9 @@ TEST(SM50_device_maximum_plus_ssrgemm_nt_t, 64x32x8_16x16x1_4x2_4x8_4x2) { using WarpShape = cutlass::gemm::GemmShape<16, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename 
cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1514,9 +1514,9 @@ TEST(SM50_device_maximum_plus_ssrgemm_nt_t, 64x64x8_16x32x1_4x4_4x8_4x2) { using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1550,9 +1550,9 @@ TEST(SM50_device_maximum_plus_ssrgemm_nt_t, 128x32x8_32x16x1_4x4_8x4_4x2) { using WarpShape = cutlass::gemm::GemmShape<32, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1586,9 +1586,9 @@ TEST(SM50_device_maximum_plus_ssrgemm_nt_t, 128x64x8_32x32x1_8x4_4x8_4x2) { using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, 
precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1622,9 +1622,9 @@ TEST(SM50_device_maximum_plus_ssrgemm_nt_t, 128x128x8_32x64x1_8x8_4x8_4x2) { using WarpShape = cutlass::gemm::GemmShape<32, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1658,9 +1658,9 @@ TEST(SM50_device_maximum_plus_ssrgemm_nt_t, 256x32x8_64x16x1_8x4_8x4_4x2) { using WarpShape = cutlass::gemm::GemmShape<64, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1694,9 +1694,9 @@ TEST(SM50_device_maximum_plus_ssrgemm_nt_t, 256x64x8_64x32x1_8x8_8x4_4x2) { using WarpShape = cutlass::gemm::GemmShape<64, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using 
Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1730,9 +1730,9 @@ TEST(SM50_device_maximum_plus_ssrgemm_nt_t, 32x64x16_8x16x1_2x2_4x8_4x4) { using WarpShape = cutlass::gemm::GemmShape<8, 16, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1766,9 +1766,9 @@ TEST(SM50_device_maximum_plus_ssrgemm_nt_t, 32x128x16_8x32x1_2x4_4x8_4x4) { using WarpShape = cutlass::gemm::GemmShape<8, 32, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1802,9 +1802,9 @@ TEST(SM50_device_maximum_plus_ssrgemm_nt_t, 64x32x16_16x8x1_2x2_8x4_4x4) { using WarpShape = cutlass::gemm::GemmShape<16, 8, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, 
precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1838,9 +1838,9 @@ TEST(SM50_device_maximum_plus_ssrgemm_nt_t, 64x64x8_16x16x1_4x2_4x8_4x4) { using WarpShape = cutlass::gemm::GemmShape<16, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1874,9 +1874,9 @@ TEST(SM50_device_maximum_plus_ssrgemm_nt_t, 64x128x8_16x32x1_4x4_4x8_4x4) { using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1910,9 +1910,9 @@ TEST(SM50_device_maximum_plus_ssrgemm_nt_t, 64x256x8_16x64x1_4x8_4x8_4x4) { using WarpShape = cutlass::gemm::GemmShape<16, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; 
using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1946,9 +1946,9 @@ TEST(SM50_device_maximum_plus_ssrgemm_nt_t, 128x32x16_32x8x1_4x2_8x4_4x4) { using WarpShape = cutlass::gemm::GemmShape<32, 8, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1982,9 +1982,9 @@ TEST(SM50_device_maximum_plus_ssrgemm_nt_t, 128x64x8_32x16x1_4x4_8x4_4x4) { using WarpShape = cutlass::gemm::GemmShape<32, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -2018,9 +2018,9 @@ TEST(SM50_device_maximum_plus_ssrgemm_nt_t, 128x128x8_32x32x1_8x4_4x8_4x4) { using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ 
-2054,9 +2054,9 @@ TEST(SM50_device_maximum_plus_ssrgemm_nt_t, 256x64x8_64x16x1_8x4_8x4_4x4) { using WarpShape = cutlass::gemm::GemmShape<64, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; diff --git a/test/device/sm50_simt_maximum_plus_ssrgemm_tn_n.cu b/test/device/sm50_simt_maximum_plus_ssrgemm_tn_n.cu index 84e6fa7..d997f12 100644 --- a/test/device/sm50_simt_maximum_plus_ssrgemm_tn_n.cu +++ b/test/device/sm50_simt_maximum_plus_ssrgemm_tn_n.cu @@ -38,9 +38,9 @@ TEST(SM50_device_maximum_plus_ssrgemm_tn_n, 8x32x8_8x32x1_2x4_4x8_1x1) { using WarpShape = cutlass::gemm::GemmShape<8, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -74,9 +74,9 @@ TEST(SM50_device_maximum_plus_ssrgemm_tn_n, 16x32x8_16x32x1_4x4_4x8_1x1) { using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + 
precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -110,9 +110,9 @@ TEST(SM50_device_maximum_plus_ssrgemm_tn_n, 16x64x8_16x64x1_4x8_4x8_1x1) { using WarpShape = cutlass::gemm::GemmShape<16, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -146,9 +146,9 @@ TEST(SM50_device_maximum_plus_ssrgemm_tn_n, 32x32x8_32x32x1_8x4_4x8_1x1) { using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -182,9 +182,9 @@ TEST(SM50_device_maximum_plus_ssrgemm_tn_n, 32x64x8_32x64x1_8x8_4x8_1x1) { using WarpShape = cutlass::gemm::GemmShape<32, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; 
using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -218,9 +218,9 @@ TEST(SM50_device_maximum_plus_ssrgemm_tn_n, 64x32x8_64x32x1_8x8_8x4_1x1) { using WarpShape = cutlass::gemm::GemmShape<64, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -254,9 +254,9 @@ TEST(SM50_device_maximum_plus_ssrgemm_tn_n, 8x32x8_8x16x1_2x2_4x8_1x2) { using WarpShape = cutlass::gemm::GemmShape<8, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -290,9 +290,9 @@ TEST(SM50_device_maximum_plus_ssrgemm_tn_n, 8x64x8_8x32x1_2x4_4x8_1x2) { using WarpShape = cutlass::gemm::GemmShape<8, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -326,9 +326,9 @@ 
TEST(SM50_device_maximum_plus_ssrgemm_tn_n, 16x32x8_16x16x1_4x2_4x8_1x2) { using WarpShape = cutlass::gemm::GemmShape<16, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -362,9 +362,9 @@ TEST(SM50_device_maximum_plus_ssrgemm_tn_n, 16x64x8_16x32x1_4x4_4x8_1x2) { using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -398,9 +398,9 @@ TEST(SM50_device_maximum_plus_ssrgemm_tn_n, 16x128x8_16x64x1_4x8_4x8_1x2) { using WarpShape = cutlass::gemm::GemmShape<16, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -434,9 +434,9 @@ TEST(SM50_device_maximum_plus_ssrgemm_tn_n, 32x32x8_32x16x1_4x4_8x4_1x2) { using WarpShape = 
cutlass::gemm::GemmShape<32, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -470,9 +470,9 @@ TEST(SM50_device_maximum_plus_ssrgemm_tn_n, 32x64x8_32x32x1_8x4_4x8_1x2) { using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -506,9 +506,9 @@ TEST(SM50_device_maximum_plus_ssrgemm_tn_n, 32x128x8_32x64x1_8x8_4x8_1x2) { using WarpShape = cutlass::gemm::GemmShape<32, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -542,9 +542,9 @@ TEST(SM50_device_maximum_plus_ssrgemm_tn_n, 64x64x8_64x32x1_8x8_8x4_1x2) { using WarpShape = cutlass::gemm::GemmShape<64, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 
1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -578,9 +578,9 @@ TEST(SM50_device_maximum_plus_ssrgemm_tn_n, 32x32x8_16x32x1_4x4_4x8_2x1) { using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -614,9 +614,9 @@ TEST(SM50_device_maximum_plus_ssrgemm_tn_n, 64x32x8_32x32x1_8x4_4x8_2x1) { using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -650,9 +650,9 @@ TEST(SM50_device_maximum_plus_ssrgemm_tn_n, 64x64x8_32x64x1_8x8_4x8_2x1) { using WarpShape = cutlass::gemm::GemmShape<32, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - 
precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -686,9 +686,9 @@ TEST(SM50_device_maximum_plus_ssrgemm_tn_n, 128x32x8_64x32x1_8x8_8x4_2x1) { using WarpShape = cutlass::gemm::GemmShape<64, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -722,9 +722,9 @@ TEST(SM50_device_maximum_plus_ssrgemm_tn_n, 16x32x8_8x16x1_2x2_4x8_2x2) { using WarpShape = cutlass::gemm::GemmShape<8, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -758,9 +758,9 @@ TEST(SM50_device_maximum_plus_ssrgemm_tn_n, 16x64x8_8x32x1_2x4_4x8_2x2) { using WarpShape = cutlass::gemm::GemmShape<8, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + 
using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -794,9 +794,9 @@ TEST(SM50_device_maximum_plus_ssrgemm_tn_n, 32x32x8_16x16x1_4x2_4x8_2x2) { using WarpShape = cutlass::gemm::GemmShape<16, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -830,9 +830,9 @@ TEST(SM50_device_maximum_plus_ssrgemm_tn_n, 32x64x8_16x32x1_4x4_4x8_2x2) { using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -866,9 +866,9 @@ TEST(SM50_device_maximum_plus_ssrgemm_tn_n, 32x128x8_16x64x1_4x8_4x8_2x2) { using WarpShape = cutlass::gemm::GemmShape<16, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, 
precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -902,9 +902,9 @@ TEST(SM50_device_maximum_plus_ssrgemm_tn_n, 64x32x8_32x16x1_4x4_8x4_2x2) { using WarpShape = cutlass::gemm::GemmShape<32, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -938,9 +938,9 @@ TEST(SM50_device_maximum_plus_ssrgemm_tn_n, 64x64x8_32x32x1_8x4_4x8_2x2) { using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -974,9 +974,9 @@ TEST(SM50_device_maximum_plus_ssrgemm_tn_n, 64x128x8_32x64x1_8x8_4x8_2x2) { using WarpShape = cutlass::gemm::GemmShape<32, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp 
= Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1010,9 +1010,9 @@ TEST(SM50_device_maximum_plus_ssrgemm_tn_n, 128x32x8_64x16x1_8x4_8x4_2x2) { using WarpShape = cutlass::gemm::GemmShape<64, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1046,9 +1046,9 @@ TEST(SM50_device_maximum_plus_ssrgemm_tn_n, 128x64x8_64x32x1_8x8_8x4_2x2) { using WarpShape = cutlass::gemm::GemmShape<64, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1082,9 +1082,9 @@ TEST(SM50_device_maximum_plus_ssrgemm_tn_n, 16x64x16_8x16x1_2x2_4x8_2x4) { using WarpShape = cutlass::gemm::GemmShape<8, 16, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1118,9 +1118,9 @@ 
TEST(SM50_device_maximum_plus_ssrgemm_tn_n, 16x128x16_8x32x1_2x4_4x8_2x4) { using WarpShape = cutlass::gemm::GemmShape<8, 32, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1154,9 +1154,9 @@ TEST(SM50_device_maximum_plus_ssrgemm_tn_n, 32x32x8_16x8x1_2x2_8x4_2x4) { using WarpShape = cutlass::gemm::GemmShape<16, 8, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1190,9 +1190,9 @@ TEST(SM50_device_maximum_plus_ssrgemm_tn_n, 32x64x8_16x16x1_4x2_4x8_2x4) { using WarpShape = cutlass::gemm::GemmShape<16, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1226,9 +1226,9 @@ TEST(SM50_device_maximum_plus_ssrgemm_tn_n, 32x128x8_16x32x1_4x4_4x8_2x4) { using 
WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1262,9 +1262,9 @@ TEST(SM50_device_maximum_plus_ssrgemm_tn_n, 32x256x8_16x64x1_4x8_4x8_2x4) { using WarpShape = cutlass::gemm::GemmShape<16, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1298,9 +1298,9 @@ TEST(SM50_device_maximum_plus_ssrgemm_tn_n, 64x64x8_32x16x1_4x4_8x4_2x4) { using WarpShape = cutlass::gemm::GemmShape<32, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1334,9 +1334,9 @@ TEST(SM50_device_maximum_plus_ssrgemm_tn_n, 64x128x8_32x32x1_8x4_4x8_2x4) { using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = 
cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1370,9 +1370,9 @@ TEST(SM50_device_maximum_plus_ssrgemm_tn_n, 64x256x8_32x64x1_8x8_4x8_2x4) { using WarpShape = cutlass::gemm::GemmShape<32, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1406,9 +1406,9 @@ TEST(SM50_device_maximum_plus_ssrgemm_tn_n, 128x128x8_64x32x1_8x8_8x4_2x4) { using WarpShape = cutlass::gemm::GemmShape<64, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1442,9 +1442,9 @@ TEST(SM50_device_maximum_plus_ssrgemm_tn_n, 32x32x8_8x16x1_2x2_4x8_4x2) { using WarpShape = cutlass::gemm::GemmShape<8, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename 
cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1478,9 +1478,9 @@ TEST(SM50_device_maximum_plus_ssrgemm_tn_n, 64x32x8_16x16x1_4x2_4x8_4x2) { using WarpShape = cutlass::gemm::GemmShape<16, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1514,9 +1514,9 @@ TEST(SM50_device_maximum_plus_ssrgemm_tn_n, 64x64x8_16x32x1_4x4_4x8_4x2) { using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1550,9 +1550,9 @@ TEST(SM50_device_maximum_plus_ssrgemm_tn_n, 128x32x8_32x16x1_4x4_8x4_4x2) { using WarpShape = cutlass::gemm::GemmShape<32, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, 
precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1586,9 +1586,9 @@ TEST(SM50_device_maximum_plus_ssrgemm_tn_n, 128x64x8_32x32x1_8x4_4x8_4x2) { using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1622,9 +1622,9 @@ TEST(SM50_device_maximum_plus_ssrgemm_tn_n, 128x128x8_32x64x1_8x8_4x8_4x2) { using WarpShape = cutlass::gemm::GemmShape<32, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1658,9 +1658,9 @@ TEST(SM50_device_maximum_plus_ssrgemm_tn_n, 256x32x8_64x16x1_8x4_8x4_4x2) { using WarpShape = cutlass::gemm::GemmShape<64, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using 
Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1694,9 +1694,9 @@ TEST(SM50_device_maximum_plus_ssrgemm_tn_n, 256x64x8_64x32x1_8x8_8x4_4x2) { using WarpShape = cutlass::gemm::GemmShape<64, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1730,9 +1730,9 @@ TEST(SM50_device_maximum_plus_ssrgemm_tn_n, 32x64x16_8x16x1_2x2_4x8_4x4) { using WarpShape = cutlass::gemm::GemmShape<8, 16, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1766,9 +1766,9 @@ TEST(SM50_device_maximum_plus_ssrgemm_tn_n, 32x128x16_8x32x1_2x4_4x8_4x4) { using WarpShape = cutlass::gemm::GemmShape<8, 32, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, 
precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1802,9 +1802,9 @@ TEST(SM50_device_maximum_plus_ssrgemm_tn_n, 64x32x16_16x8x1_2x2_8x4_4x4) { using WarpShape = cutlass::gemm::GemmShape<16, 8, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1838,9 +1838,9 @@ TEST(SM50_device_maximum_plus_ssrgemm_tn_n, 64x64x8_16x16x1_4x2_4x8_4x4) { using WarpShape = cutlass::gemm::GemmShape<16, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1874,9 +1874,9 @@ TEST(SM50_device_maximum_plus_ssrgemm_tn_n, 64x128x8_16x32x1_4x4_4x8_4x4) { using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using 
AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1910,9 +1910,9 @@ TEST(SM50_device_maximum_plus_ssrgemm_tn_n, 64x256x8_16x64x1_4x8_4x8_4x4) { using WarpShape = cutlass::gemm::GemmShape<16, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1946,9 +1946,9 @@ TEST(SM50_device_maximum_plus_ssrgemm_tn_n, 128x32x16_32x8x1_4x2_8x4_4x4) { using WarpShape = cutlass::gemm::GemmShape<32, 8, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1982,9 +1982,9 @@ TEST(SM50_device_maximum_plus_ssrgemm_tn_n, 128x64x8_32x16x1_4x4_8x4_4x4) { using WarpShape = cutlass::gemm::GemmShape<32, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -2018,9 
+2018,9 @@ TEST(SM50_device_maximum_plus_ssrgemm_tn_n, 128x128x8_32x32x1_8x4_4x8_4x4) { using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -2054,9 +2054,9 @@ TEST(SM50_device_maximum_plus_ssrgemm_tn_n, 256x64x8_64x16x1_8x4_8x4_4x4) { using WarpShape = cutlass::gemm::GemmShape<64, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; diff --git a/test/device/sm50_simt_maximum_plus_ssrgemm_tn_t.cu b/test/device/sm50_simt_maximum_plus_ssrgemm_tn_t.cu index d8e96ac..c5f6e98 100644 --- a/test/device/sm50_simt_maximum_plus_ssrgemm_tn_t.cu +++ b/test/device/sm50_simt_maximum_plus_ssrgemm_tn_t.cu @@ -38,9 +38,9 @@ TEST(SM50_device_maximum_plus_ssrgemm_tn_t, 8x32x8_8x32x1_2x4_4x8_1x1) { using WarpShape = cutlass::gemm::GemmShape<8, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, 
precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -74,9 +74,9 @@ TEST(SM50_device_maximum_plus_ssrgemm_tn_t, 16x32x8_16x32x1_4x4_4x8_1x1) { using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -110,9 +110,9 @@ TEST(SM50_device_maximum_plus_ssrgemm_tn_t, 16x64x8_16x64x1_4x8_4x8_1x1) { using WarpShape = cutlass::gemm::GemmShape<16, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -146,9 +146,9 @@ TEST(SM50_device_maximum_plus_ssrgemm_tn_t, 32x32x8_32x32x1_8x4_4x8_1x1) { using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = 
Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -182,9 +182,9 @@ TEST(SM50_device_maximum_plus_ssrgemm_tn_t, 32x64x8_32x64x1_8x8_4x8_1x1) { using WarpShape = cutlass::gemm::GemmShape<32, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -218,9 +218,9 @@ TEST(SM50_device_maximum_plus_ssrgemm_tn_t, 64x32x8_64x32x1_8x8_8x4_1x1) { using WarpShape = cutlass::gemm::GemmShape<64, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -254,9 +254,9 @@ TEST(SM50_device_maximum_plus_ssrgemm_tn_t, 8x32x8_8x16x1_2x2_4x8_1x2) { using WarpShape = cutlass::gemm::GemmShape<8, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -290,9 +290,9 @@ 
TEST(SM50_device_maximum_plus_ssrgemm_tn_t, 8x64x8_8x32x1_2x4_4x8_1x2) { using WarpShape = cutlass::gemm::GemmShape<8, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -326,9 +326,9 @@ TEST(SM50_device_maximum_plus_ssrgemm_tn_t, 16x32x8_16x16x1_4x2_4x8_1x2) { using WarpShape = cutlass::gemm::GemmShape<16, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -362,9 +362,9 @@ TEST(SM50_device_maximum_plus_ssrgemm_tn_t, 16x64x8_16x32x1_4x4_4x8_1x2) { using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -398,9 +398,9 @@ TEST(SM50_device_maximum_plus_ssrgemm_tn_t, 16x128x8_16x64x1_4x8_4x8_1x2) { using WarpShape = 
cutlass::gemm::GemmShape<16, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -434,9 +434,9 @@ TEST(SM50_device_maximum_plus_ssrgemm_tn_t, 32x32x8_32x16x1_4x4_8x4_1x2) { using WarpShape = cutlass::gemm::GemmShape<32, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -470,9 +470,9 @@ TEST(SM50_device_maximum_plus_ssrgemm_tn_t, 32x64x8_32x32x1_8x4_4x8_1x2) { using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -506,9 +506,9 @@ TEST(SM50_device_maximum_plus_ssrgemm_tn_t, 32x128x8_32x64x1_8x8_4x8_1x2) { using WarpShape = cutlass::gemm::GemmShape<32, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 
1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -542,9 +542,9 @@ TEST(SM50_device_maximum_plus_ssrgemm_tn_t, 64x64x8_64x32x1_8x8_8x4_1x2) { using WarpShape = cutlass::gemm::GemmShape<64, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -578,9 +578,9 @@ TEST(SM50_device_maximum_plus_ssrgemm_tn_t, 32x32x8_16x32x1_4x4_4x8_2x1) { using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -614,9 +614,9 @@ TEST(SM50_device_maximum_plus_ssrgemm_tn_t, 64x32x8_32x32x1_8x4_4x8_2x1) { using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - 
precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -650,9 +650,9 @@ TEST(SM50_device_maximum_plus_ssrgemm_tn_t, 64x64x8_32x64x1_8x8_4x8_2x1) { using WarpShape = cutlass::gemm::GemmShape<32, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -686,9 +686,9 @@ TEST(SM50_device_maximum_plus_ssrgemm_tn_t, 128x32x8_64x32x1_8x8_8x4_2x1) { using WarpShape = cutlass::gemm::GemmShape<64, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -722,9 +722,9 @@ TEST(SM50_device_maximum_plus_ssrgemm_tn_t, 16x32x8_8x16x1_2x2_4x8_2x2) { using WarpShape = cutlass::gemm::GemmShape<8, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; 
+ using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -758,9 +758,9 @@ TEST(SM50_device_maximum_plus_ssrgemm_tn_t, 16x64x8_8x32x1_2x4_4x8_2x2) { using WarpShape = cutlass::gemm::GemmShape<8, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -794,9 +794,9 @@ TEST(SM50_device_maximum_plus_ssrgemm_tn_t, 32x32x8_16x16x1_4x2_4x8_2x2) { using WarpShape = cutlass::gemm::GemmShape<16, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -830,9 +830,9 @@ TEST(SM50_device_maximum_plus_ssrgemm_tn_t, 32x64x8_16x32x1_4x4_4x8_2x2) { using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, 
precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -866,9 +866,9 @@ TEST(SM50_device_maximum_plus_ssrgemm_tn_t, 32x128x8_16x64x1_4x8_4x8_2x2) { using WarpShape = cutlass::gemm::GemmShape<16, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -902,9 +902,9 @@ TEST(SM50_device_maximum_plus_ssrgemm_tn_t, 64x32x8_32x16x1_4x4_8x4_2x2) { using WarpShape = cutlass::gemm::GemmShape<32, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -938,9 +938,9 @@ TEST(SM50_device_maximum_plus_ssrgemm_tn_t, 64x64x8_32x32x1_8x4_4x8_2x2) { using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp 
= Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -974,9 +974,9 @@ TEST(SM50_device_maximum_plus_ssrgemm_tn_t, 64x128x8_32x64x1_8x8_4x8_2x2) { using WarpShape = cutlass::gemm::GemmShape<32, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1010,9 +1010,9 @@ TEST(SM50_device_maximum_plus_ssrgemm_tn_t, 128x32x8_64x16x1_8x4_8x4_2x2) { using WarpShape = cutlass::gemm::GemmShape<64, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1046,9 +1046,9 @@ TEST(SM50_device_maximum_plus_ssrgemm_tn_t, 128x64x8_64x32x1_8x8_8x4_2x2) { using WarpShape = cutlass::gemm::GemmShape<64, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1082,9 +1082,9 @@ 
TEST(SM50_device_maximum_plus_ssrgemm_tn_t, 16x64x16_8x16x1_2x2_4x8_2x4) { using WarpShape = cutlass::gemm::GemmShape<8, 16, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1118,9 +1118,9 @@ TEST(SM50_device_maximum_plus_ssrgemm_tn_t, 16x128x16_8x32x1_2x4_4x8_2x4) { using WarpShape = cutlass::gemm::GemmShape<8, 32, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1154,9 +1154,9 @@ TEST(SM50_device_maximum_plus_ssrgemm_tn_t, 32x32x8_16x8x1_2x2_8x4_2x4) { using WarpShape = cutlass::gemm::GemmShape<16, 8, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1190,9 +1190,9 @@ TEST(SM50_device_maximum_plus_ssrgemm_tn_t, 32x64x8_16x16x1_4x2_4x8_2x4) { using 
WarpShape = cutlass::gemm::GemmShape<16, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1226,9 +1226,9 @@ TEST(SM50_device_maximum_plus_ssrgemm_tn_t, 32x128x8_16x32x1_4x4_4x8_2x4) { using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1262,9 +1262,9 @@ TEST(SM50_device_maximum_plus_ssrgemm_tn_t, 32x256x8_16x64x1_4x8_4x8_2x4) { using WarpShape = cutlass::gemm::GemmShape<16, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1298,9 +1298,9 @@ TEST(SM50_device_maximum_plus_ssrgemm_tn_t, 64x64x8_32x16x1_4x4_8x4_2x4) { using WarpShape = cutlass::gemm::GemmShape<32, 16, 8>; using InstructionShape = 
cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1334,9 +1334,9 @@ TEST(SM50_device_maximum_plus_ssrgemm_tn_t, 64x128x8_32x32x1_8x4_4x8_2x4) { using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1370,9 +1370,9 @@ TEST(SM50_device_maximum_plus_ssrgemm_tn_t, 64x256x8_32x64x1_8x8_4x8_2x4) { using WarpShape = cutlass::gemm::GemmShape<32, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1406,9 +1406,9 @@ TEST(SM50_device_maximum_plus_ssrgemm_tn_t, 128x128x8_64x32x1_8x8_8x4_2x4) { using WarpShape = cutlass::gemm::GemmShape<64, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename 
cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1442,9 +1442,9 @@ TEST(SM50_device_maximum_plus_ssrgemm_tn_t, 32x32x8_8x16x1_2x2_4x8_4x2) { using WarpShape = cutlass::gemm::GemmShape<8, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1478,9 +1478,9 @@ TEST(SM50_device_maximum_plus_ssrgemm_tn_t, 64x32x8_16x16x1_4x2_4x8_4x2) { using WarpShape = cutlass::gemm::GemmShape<16, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1514,9 +1514,9 @@ TEST(SM50_device_maximum_plus_ssrgemm_tn_t, 64x64x8_16x32x1_4x4_4x8_4x2) { using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, 
precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1550,9 +1550,9 @@ TEST(SM50_device_maximum_plus_ssrgemm_tn_t, 128x32x8_32x16x1_4x4_8x4_4x2) { using WarpShape = cutlass::gemm::GemmShape<32, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1586,9 +1586,9 @@ TEST(SM50_device_maximum_plus_ssrgemm_tn_t, 128x64x8_32x32x1_8x4_4x8_4x2) { using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1622,9 +1622,9 @@ TEST(SM50_device_maximum_plus_ssrgemm_tn_t, 128x128x8_32x64x1_8x8_4x8_4x2) { using WarpShape = cutlass::gemm::GemmShape<32, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = 
typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1658,9 +1658,9 @@ TEST(SM50_device_maximum_plus_ssrgemm_tn_t, 256x32x8_64x16x1_8x4_8x4_4x2) { using WarpShape = cutlass::gemm::GemmShape<64, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1694,9 +1694,9 @@ TEST(SM50_device_maximum_plus_ssrgemm_tn_t, 256x64x8_64x32x1_8x8_8x4_4x2) { using WarpShape = cutlass::gemm::GemmShape<64, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1730,9 +1730,9 @@ TEST(SM50_device_maximum_plus_ssrgemm_tn_t, 32x64x16_8x16x1_2x2_4x8_4x4) { using WarpShape = cutlass::gemm::GemmShape<8, 16, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, 
precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1766,9 +1766,9 @@ TEST(SM50_device_maximum_plus_ssrgemm_tn_t, 32x128x16_8x32x1_2x4_4x8_4x4) { using WarpShape = cutlass::gemm::GemmShape<8, 32, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1802,9 +1802,9 @@ TEST(SM50_device_maximum_plus_ssrgemm_tn_t, 64x32x16_16x8x1_2x2_8x4_4x4) { using WarpShape = cutlass::gemm::GemmShape<16, 8, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1838,9 +1838,9 @@ TEST(SM50_device_maximum_plus_ssrgemm_tn_t, 64x64x8_16x16x1_4x2_4x8_4x4) { using WarpShape = cutlass::gemm::GemmShape<16, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = 
Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1874,9 +1874,9 @@ TEST(SM50_device_maximum_plus_ssrgemm_tn_t, 64x128x8_16x32x1_4x4_4x8_4x4) { using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1910,9 +1910,9 @@ TEST(SM50_device_maximum_plus_ssrgemm_tn_t, 64x256x8_16x64x1_4x8_4x8_4x4) { using WarpShape = cutlass::gemm::GemmShape<16, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1946,9 +1946,9 @@ TEST(SM50_device_maximum_plus_ssrgemm_tn_t, 128x32x16_32x8x1_4x2_8x4_4x4) { using WarpShape = cutlass::gemm::GemmShape<32, 8, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1982,9 +1982,9 @@ 
TEST(SM50_device_maximum_plus_ssrgemm_tn_t, 128x64x8_32x16x1_4x4_8x4_4x4) { using WarpShape = cutlass::gemm::GemmShape<32, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -2018,9 +2018,9 @@ TEST(SM50_device_maximum_plus_ssrgemm_tn_t, 128x128x8_32x32x1_8x4_4x8_4x4) { using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -2054,9 +2054,9 @@ TEST(SM50_device_maximum_plus_ssrgemm_tn_t, 256x64x8_64x16x1_8x4_8x4_4x4) { using WarpShape = cutlass::gemm::GemmShape<64, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; diff --git a/test/device/sm50_simt_maximum_plus_ssrgemm_tt_n.cu 
b/test/device/sm50_simt_maximum_plus_ssrgemm_tt_n.cu index ef7f2df..4fca26e 100644 --- a/test/device/sm50_simt_maximum_plus_ssrgemm_tt_n.cu +++ b/test/device/sm50_simt_maximum_plus_ssrgemm_tt_n.cu @@ -38,9 +38,9 @@ TEST(SM50_device_maximum_plus_ssrgemm_tt_n, 8x32x8_8x32x1_2x4_4x8_1x1) { using WarpShape = cutlass::gemm::GemmShape<8, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -74,9 +74,9 @@ TEST(SM50_device_maximum_plus_ssrgemm_tt_n, 16x32x8_16x32x1_4x4_4x8_1x1) { using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -110,9 +110,9 @@ TEST(SM50_device_maximum_plus_ssrgemm_tt_n, 16x64x8_16x64x1_4x8_4x8_1x1) { using WarpShape = cutlass::gemm::GemmShape<16, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, 
cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -146,9 +146,9 @@ TEST(SM50_device_maximum_plus_ssrgemm_tt_n, 32x32x8_32x32x1_8x4_4x8_1x1) { using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -182,9 +182,9 @@ TEST(SM50_device_maximum_plus_ssrgemm_tt_n, 32x64x8_32x64x1_8x8_4x8_1x1) { using WarpShape = cutlass::gemm::GemmShape<32, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -218,9 +218,9 @@ TEST(SM50_device_maximum_plus_ssrgemm_tt_n, 64x32x8_64x32x1_8x8_8x4_1x1) { using WarpShape = cutlass::gemm::GemmShape<64, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = 
Config::MultiplicationOp; @@ -254,9 +254,9 @@ TEST(SM50_device_maximum_plus_ssrgemm_tt_n, 8x32x8_8x16x1_2x2_4x8_1x2) { using WarpShape = cutlass::gemm::GemmShape<8, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -290,9 +290,9 @@ TEST(SM50_device_maximum_plus_ssrgemm_tt_n, 8x64x8_8x32x1_2x4_4x8_1x2) { using WarpShape = cutlass::gemm::GemmShape<8, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -326,9 +326,9 @@ TEST(SM50_device_maximum_plus_ssrgemm_tt_n, 16x32x8_16x16x1_4x2_4x8_1x2) { using WarpShape = cutlass::gemm::GemmShape<16, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -362,9 +362,9 @@ TEST(SM50_device_maximum_plus_ssrgemm_tt_n, 
16x64x8_16x32x1_4x4_4x8_1x2) { using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -398,9 +398,9 @@ TEST(SM50_device_maximum_plus_ssrgemm_tt_n, 16x128x8_16x64x1_4x8_4x8_1x2) { using WarpShape = cutlass::gemm::GemmShape<16, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -434,9 +434,9 @@ TEST(SM50_device_maximum_plus_ssrgemm_tt_n, 32x32x8_32x16x1_4x4_8x4_1x2) { using WarpShape = cutlass::gemm::GemmShape<32, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -470,9 +470,9 @@ TEST(SM50_device_maximum_plus_ssrgemm_tt_n, 32x64x8_32x32x1_8x4_4x8_1x2) { using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using 
InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -506,9 +506,9 @@ TEST(SM50_device_maximum_plus_ssrgemm_tt_n, 32x128x8_32x64x1_8x8_4x8_1x2) { using WarpShape = cutlass::gemm::GemmShape<32, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -542,9 +542,9 @@ TEST(SM50_device_maximum_plus_ssrgemm_tt_n, 64x64x8_64x32x1_8x8_8x4_1x2) { using WarpShape = cutlass::gemm::GemmShape<64, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -578,9 +578,9 @@ TEST(SM50_device_maximum_plus_ssrgemm_tt_n, 32x32x8_16x32x1_4x4_4x8_2x1) { using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename 
cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -614,9 +614,9 @@ TEST(SM50_device_maximum_plus_ssrgemm_tt_n, 64x32x8_32x32x1_8x4_4x8_2x1) { using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -650,9 +650,9 @@ TEST(SM50_device_maximum_plus_ssrgemm_tt_n, 64x64x8_32x64x1_8x8_4x8_2x1) { using WarpShape = cutlass::gemm::GemmShape<32, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -686,9 +686,9 @@ TEST(SM50_device_maximum_plus_ssrgemm_tt_n, 128x32x8_64x32x1_8x8_8x4_2x1) { using WarpShape = cutlass::gemm::GemmShape<64, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, 
precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -722,9 +722,9 @@ TEST(SM50_device_maximum_plus_ssrgemm_tt_n, 16x32x8_8x16x1_2x2_4x8_2x2) { using WarpShape = cutlass::gemm::GemmShape<8, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -758,9 +758,9 @@ TEST(SM50_device_maximum_plus_ssrgemm_tt_n, 16x64x8_8x32x1_2x4_4x8_2x2) { using WarpShape = cutlass::gemm::GemmShape<8, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -794,9 +794,9 @@ TEST(SM50_device_maximum_plus_ssrgemm_tt_n, 32x32x8_16x16x1_4x2_4x8_2x2) { using WarpShape = cutlass::gemm::GemmShape<16, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename 
cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -830,9 +830,9 @@ TEST(SM50_device_maximum_plus_ssrgemm_tt_n, 32x64x8_16x32x1_4x4_4x8_2x2) { using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -866,9 +866,9 @@ TEST(SM50_device_maximum_plus_ssrgemm_tt_n, 32x128x8_16x64x1_4x8_4x8_2x2) { using WarpShape = cutlass::gemm::GemmShape<16, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -902,9 +902,9 @@ TEST(SM50_device_maximum_plus_ssrgemm_tt_n, 64x32x8_32x16x1_4x4_8x4_2x2) { using WarpShape = cutlass::gemm::GemmShape<32, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, 
precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -938,9 +938,9 @@ TEST(SM50_device_maximum_plus_ssrgemm_tt_n, 64x64x8_32x32x1_8x4_4x8_2x2) { using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -974,9 +974,9 @@ TEST(SM50_device_maximum_plus_ssrgemm_tt_n, 64x128x8_32x64x1_8x8_4x8_2x2) { using WarpShape = cutlass::gemm::GemmShape<32, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1010,9 +1010,9 @@ TEST(SM50_device_maximum_plus_ssrgemm_tt_n, 128x32x8_64x16x1_8x4_8x4_2x2) { using WarpShape = cutlass::gemm::GemmShape<64, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = 
Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1046,9 +1046,9 @@ TEST(SM50_device_maximum_plus_ssrgemm_tt_n, 128x64x8_64x32x1_8x8_8x4_2x2) { using WarpShape = cutlass::gemm::GemmShape<64, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1082,9 +1082,9 @@ TEST(SM50_device_maximum_plus_ssrgemm_tt_n, 16x64x16_8x16x1_2x2_4x8_2x4) { using WarpShape = cutlass::gemm::GemmShape<8, 16, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1118,9 +1118,9 @@ TEST(SM50_device_maximum_plus_ssrgemm_tt_n, 16x128x16_8x32x1_2x4_4x8_2x4) { using WarpShape = cutlass::gemm::GemmShape<8, 32, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1154,9 +1154,9 @@ 
TEST(SM50_device_maximum_plus_ssrgemm_tt_n, 32x32x8_16x8x1_2x2_8x4_2x4) { using WarpShape = cutlass::gemm::GemmShape<16, 8, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1190,9 +1190,9 @@ TEST(SM50_device_maximum_plus_ssrgemm_tt_n, 32x64x8_16x16x1_4x2_4x8_2x4) { using WarpShape = cutlass::gemm::GemmShape<16, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1226,9 +1226,9 @@ TEST(SM50_device_maximum_plus_ssrgemm_tt_n, 32x128x8_16x32x1_4x4_4x8_2x4) { using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1262,9 +1262,9 @@ TEST(SM50_device_maximum_plus_ssrgemm_tt_n, 32x256x8_16x64x1_4x8_4x8_2x4) { using 
WarpShape = cutlass::gemm::GemmShape<16, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1298,9 +1298,9 @@ TEST(SM50_device_maximum_plus_ssrgemm_tt_n, 64x64x8_32x16x1_4x4_8x4_2x4) { using WarpShape = cutlass::gemm::GemmShape<32, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1334,9 +1334,9 @@ TEST(SM50_device_maximum_plus_ssrgemm_tt_n, 64x128x8_32x32x1_8x4_4x8_2x4) { using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1370,9 +1370,9 @@ TEST(SM50_device_maximum_plus_ssrgemm_tt_n, 64x256x8_32x64x1_8x8_4x8_2x4) { using WarpShape = cutlass::gemm::GemmShape<32, 64, 8>; using InstructionShape = 
cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1406,9 +1406,9 @@ TEST(SM50_device_maximum_plus_ssrgemm_tt_n, 128x128x8_64x32x1_8x8_8x4_2x4) { using WarpShape = cutlass::gemm::GemmShape<64, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1442,9 +1442,9 @@ TEST(SM50_device_maximum_plus_ssrgemm_tt_n, 32x32x8_8x16x1_2x2_4x8_4x2) { using WarpShape = cutlass::gemm::GemmShape<8, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1478,9 +1478,9 @@ TEST(SM50_device_maximum_plus_ssrgemm_tt_n, 64x32x8_16x16x1_4x2_4x8_4x2) { using WarpShape = cutlass::gemm::GemmShape<16, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename 
cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1514,9 +1514,9 @@ TEST(SM50_device_maximum_plus_ssrgemm_tt_n, 64x64x8_16x32x1_4x4_4x8_4x2) { using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1550,9 +1550,9 @@ TEST(SM50_device_maximum_plus_ssrgemm_tt_n, 128x32x8_32x16x1_4x4_8x4_4x2) { using WarpShape = cutlass::gemm::GemmShape<32, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1586,9 +1586,9 @@ TEST(SM50_device_maximum_plus_ssrgemm_tt_n, 128x64x8_32x32x1_8x4_4x8_4x2) { using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, 
precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1622,9 +1622,9 @@ TEST(SM50_device_maximum_plus_ssrgemm_tt_n, 128x128x8_32x64x1_8x8_4x8_4x2) { using WarpShape = cutlass::gemm::GemmShape<32, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1658,9 +1658,9 @@ TEST(SM50_device_maximum_plus_ssrgemm_tt_n, 256x32x8_64x16x1_8x4_8x4_4x2) { using WarpShape = cutlass::gemm::GemmShape<64, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1694,9 +1694,9 @@ TEST(SM50_device_maximum_plus_ssrgemm_tt_n, 256x64x8_64x32x1_8x8_8x4_4x2) { using WarpShape = cutlass::gemm::GemmShape<64, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using 
Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1730,9 +1730,9 @@ TEST(SM50_device_maximum_plus_ssrgemm_tt_n, 32x64x16_8x16x1_2x2_4x8_4x4) { using WarpShape = cutlass::gemm::GemmShape<8, 16, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1766,9 +1766,9 @@ TEST(SM50_device_maximum_plus_ssrgemm_tt_n, 32x128x16_8x32x1_2x4_4x8_4x4) { using WarpShape = cutlass::gemm::GemmShape<8, 32, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1802,9 +1802,9 @@ TEST(SM50_device_maximum_plus_ssrgemm_tt_n, 64x32x16_16x8x1_2x2_8x4_4x4) { using WarpShape = cutlass::gemm::GemmShape<16, 8, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, 
precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1838,9 +1838,9 @@ TEST(SM50_device_maximum_plus_ssrgemm_tt_n, 64x64x8_16x16x1_4x2_4x8_4x4) { using WarpShape = cutlass::gemm::GemmShape<16, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1874,9 +1874,9 @@ TEST(SM50_device_maximum_plus_ssrgemm_tt_n, 64x128x8_16x32x1_4x4_4x8_4x4) { using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1910,9 +1910,9 @@ TEST(SM50_device_maximum_plus_ssrgemm_tt_n, 64x256x8_16x64x1_4x8_4x8_4x4) { using WarpShape = cutlass::gemm::GemmShape<16, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; 
using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1946,9 +1946,9 @@ TEST(SM50_device_maximum_plus_ssrgemm_tt_n, 128x32x16_32x8x1_4x2_8x4_4x4) { using WarpShape = cutlass::gemm::GemmShape<32, 8, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1982,9 +1982,9 @@ TEST(SM50_device_maximum_plus_ssrgemm_tt_n, 128x64x8_32x16x1_4x4_8x4_4x4) { using WarpShape = cutlass::gemm::GemmShape<32, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -2018,9 +2018,9 @@ TEST(SM50_device_maximum_plus_ssrgemm_tt_n, 128x128x8_32x32x1_8x4_4x8_4x4) { using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ 
-2054,9 +2054,9 @@ TEST(SM50_device_maximum_plus_ssrgemm_tt_n, 256x64x8_64x16x1_8x4_8x4_4x4) { using WarpShape = cutlass::gemm::GemmShape<64, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; diff --git a/test/device/sm50_simt_maximum_plus_ssrgemm_tt_t.cu b/test/device/sm50_simt_maximum_plus_ssrgemm_tt_t.cu index 3fbaaa1..0ac877f 100644 --- a/test/device/sm50_simt_maximum_plus_ssrgemm_tt_t.cu +++ b/test/device/sm50_simt_maximum_plus_ssrgemm_tt_t.cu @@ -38,9 +38,9 @@ TEST(SM50_device_maximum_plus_ssrgemm_tt_t, 8x32x8_8x32x1_2x4_4x8_1x1) { using WarpShape = cutlass::gemm::GemmShape<8, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -74,9 +74,9 @@ TEST(SM50_device_maximum_plus_ssrgemm_tt_t, 16x32x8_16x32x1_4x4_4x8_1x1) { using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + 
precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -110,9 +110,9 @@ TEST(SM50_device_maximum_plus_ssrgemm_tt_t, 16x64x8_16x64x1_4x8_4x8_1x1) { using WarpShape = cutlass::gemm::GemmShape<16, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -146,9 +146,9 @@ TEST(SM50_device_maximum_plus_ssrgemm_tt_t, 32x32x8_32x32x1_8x4_4x8_1x1) { using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -182,9 +182,9 @@ TEST(SM50_device_maximum_plus_ssrgemm_tt_t, 32x64x8_32x64x1_8x8_4x8_1x1) { using WarpShape = cutlass::gemm::GemmShape<32, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; 
using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -218,9 +218,9 @@ TEST(SM50_device_maximum_plus_ssrgemm_tt_t, 64x32x8_64x32x1_8x8_8x4_1x1) { using WarpShape = cutlass::gemm::GemmShape<64, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -254,9 +254,9 @@ TEST(SM50_device_maximum_plus_ssrgemm_tt_t, 8x32x8_8x16x1_2x2_4x8_1x2) { using WarpShape = cutlass::gemm::GemmShape<8, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -290,9 +290,9 @@ TEST(SM50_device_maximum_plus_ssrgemm_tt_t, 8x64x8_8x32x1_2x4_4x8_1x2) { using WarpShape = cutlass::gemm::GemmShape<8, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -326,9 +326,9 @@ 
TEST(SM50_device_maximum_plus_ssrgemm_tt_t, 16x32x8_16x16x1_4x2_4x8_1x2) { using WarpShape = cutlass::gemm::GemmShape<16, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -362,9 +362,9 @@ TEST(SM50_device_maximum_plus_ssrgemm_tt_t, 16x64x8_16x32x1_4x4_4x8_1x2) { using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -398,9 +398,9 @@ TEST(SM50_device_maximum_plus_ssrgemm_tt_t, 16x128x8_16x64x1_4x8_4x8_1x2) { using WarpShape = cutlass::gemm::GemmShape<16, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -434,9 +434,9 @@ TEST(SM50_device_maximum_plus_ssrgemm_tt_t, 32x32x8_32x16x1_4x4_8x4_1x2) { using WarpShape = 
cutlass::gemm::GemmShape<32, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -470,9 +470,9 @@ TEST(SM50_device_maximum_plus_ssrgemm_tt_t, 32x64x8_32x32x1_8x4_4x8_1x2) { using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -506,9 +506,9 @@ TEST(SM50_device_maximum_plus_ssrgemm_tt_t, 32x128x8_32x64x1_8x8_4x8_1x2) { using WarpShape = cutlass::gemm::GemmShape<32, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -542,9 +542,9 @@ TEST(SM50_device_maximum_plus_ssrgemm_tt_t, 64x64x8_64x32x1_8x8_8x4_1x2) { using WarpShape = cutlass::gemm::GemmShape<64, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 
1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -578,9 +578,9 @@ TEST(SM50_device_maximum_plus_ssrgemm_tt_t, 32x32x8_16x32x1_4x4_4x8_2x1) { using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -614,9 +614,9 @@ TEST(SM50_device_maximum_plus_ssrgemm_tt_t, 64x32x8_32x32x1_8x4_4x8_2x1) { using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -650,9 +650,9 @@ TEST(SM50_device_maximum_plus_ssrgemm_tt_t, 64x64x8_32x64x1_8x8_4x8_2x1) { using WarpShape = cutlass::gemm::GemmShape<32, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - 
precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -686,9 +686,9 @@ TEST(SM50_device_maximum_plus_ssrgemm_tt_t, 128x32x8_64x32x1_8x8_8x4_2x1) { using WarpShape = cutlass::gemm::GemmShape<64, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -722,9 +722,9 @@ TEST(SM50_device_maximum_plus_ssrgemm_tt_t, 16x32x8_8x16x1_2x2_4x8_2x2) { using WarpShape = cutlass::gemm::GemmShape<8, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -758,9 +758,9 @@ TEST(SM50_device_maximum_plus_ssrgemm_tt_t, 16x64x8_8x32x1_2x4_4x8_2x2) { using WarpShape = cutlass::gemm::GemmShape<8, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + 
using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -794,9 +794,9 @@ TEST(SM50_device_maximum_plus_ssrgemm_tt_t, 32x32x8_16x16x1_4x2_4x8_2x2) { using WarpShape = cutlass::gemm::GemmShape<16, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -830,9 +830,9 @@ TEST(SM50_device_maximum_plus_ssrgemm_tt_t, 32x64x8_16x32x1_4x4_4x8_2x2) { using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -866,9 +866,9 @@ TEST(SM50_device_maximum_plus_ssrgemm_tt_t, 32x128x8_16x64x1_4x8_4x8_2x2) { using WarpShape = cutlass::gemm::GemmShape<16, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, 
precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -902,9 +902,9 @@ TEST(SM50_device_maximum_plus_ssrgemm_tt_t, 64x32x8_32x16x1_4x4_8x4_2x2) { using WarpShape = cutlass::gemm::GemmShape<32, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -938,9 +938,9 @@ TEST(SM50_device_maximum_plus_ssrgemm_tt_t, 64x64x8_32x32x1_8x4_4x8_2x2) { using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -974,9 +974,9 @@ TEST(SM50_device_maximum_plus_ssrgemm_tt_t, 64x128x8_32x64x1_8x8_4x8_2x2) { using WarpShape = cutlass::gemm::GemmShape<32, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp 
= Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1010,9 +1010,9 @@ TEST(SM50_device_maximum_plus_ssrgemm_tt_t, 128x32x8_64x16x1_8x4_8x4_2x2) { using WarpShape = cutlass::gemm::GemmShape<64, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1046,9 +1046,9 @@ TEST(SM50_device_maximum_plus_ssrgemm_tt_t, 128x64x8_64x32x1_8x8_8x4_2x2) { using WarpShape = cutlass::gemm::GemmShape<64, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1082,9 +1082,9 @@ TEST(SM50_device_maximum_plus_ssrgemm_tt_t, 16x64x16_8x16x1_2x2_4x8_2x4) { using WarpShape = cutlass::gemm::GemmShape<8, 16, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1118,9 +1118,9 @@ 
TEST(SM50_device_maximum_plus_ssrgemm_tt_t, 16x128x16_8x32x1_2x4_4x8_2x4) { using WarpShape = cutlass::gemm::GemmShape<8, 32, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1154,9 +1154,9 @@ TEST(SM50_device_maximum_plus_ssrgemm_tt_t, 32x32x8_16x8x1_2x2_8x4_2x4) { using WarpShape = cutlass::gemm::GemmShape<16, 8, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1190,9 +1190,9 @@ TEST(SM50_device_maximum_plus_ssrgemm_tt_t, 32x64x8_16x16x1_4x2_4x8_2x4) { using WarpShape = cutlass::gemm::GemmShape<16, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1226,9 +1226,9 @@ TEST(SM50_device_maximum_plus_ssrgemm_tt_t, 32x128x8_16x32x1_4x4_4x8_2x4) { using 
WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1262,9 +1262,9 @@ TEST(SM50_device_maximum_plus_ssrgemm_tt_t, 32x256x8_16x64x1_4x8_4x8_2x4) { using WarpShape = cutlass::gemm::GemmShape<16, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1298,9 +1298,9 @@ TEST(SM50_device_maximum_plus_ssrgemm_tt_t, 64x64x8_32x16x1_4x4_8x4_2x4) { using WarpShape = cutlass::gemm::GemmShape<32, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1334,9 +1334,9 @@ TEST(SM50_device_maximum_plus_ssrgemm_tt_t, 64x128x8_32x32x1_8x4_4x8_2x4) { using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = 
cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1370,9 +1370,9 @@ TEST(SM50_device_maximum_plus_ssrgemm_tt_t, 64x256x8_32x64x1_8x8_4x8_2x4) { using WarpShape = cutlass::gemm::GemmShape<32, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1406,9 +1406,9 @@ TEST(SM50_device_maximum_plus_ssrgemm_tt_t, 128x128x8_64x32x1_8x8_8x4_2x4) { using WarpShape = cutlass::gemm::GemmShape<64, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1442,9 +1442,9 @@ TEST(SM50_device_maximum_plus_ssrgemm_tt_t, 32x32x8_8x16x1_2x2_4x8_4x2) { using WarpShape = cutlass::gemm::GemmShape<8, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename 
cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1478,9 +1478,9 @@ TEST(SM50_device_maximum_plus_ssrgemm_tt_t, 64x32x8_16x16x1_4x2_4x8_4x2) { using WarpShape = cutlass::gemm::GemmShape<16, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1514,9 +1514,9 @@ TEST(SM50_device_maximum_plus_ssrgemm_tt_t, 64x64x8_16x32x1_4x4_4x8_4x2) { using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1550,9 +1550,9 @@ TEST(SM50_device_maximum_plus_ssrgemm_tt_t, 128x32x8_32x16x1_4x4_8x4_4x2) { using WarpShape = cutlass::gemm::GemmShape<32, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, 
precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1586,9 +1586,9 @@ TEST(SM50_device_maximum_plus_ssrgemm_tt_t, 128x64x8_32x32x1_8x4_4x8_4x2) { using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1622,9 +1622,9 @@ TEST(SM50_device_maximum_plus_ssrgemm_tt_t, 128x128x8_32x64x1_8x8_4x8_4x2) { using WarpShape = cutlass::gemm::GemmShape<32, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1658,9 +1658,9 @@ TEST(SM50_device_maximum_plus_ssrgemm_tt_t, 256x32x8_64x16x1_8x4_8x4_4x2) { using WarpShape = cutlass::gemm::GemmShape<64, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using 
Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1694,9 +1694,9 @@ TEST(SM50_device_maximum_plus_ssrgemm_tt_t, 256x64x8_64x32x1_8x8_8x4_4x2) { using WarpShape = cutlass::gemm::GemmShape<64, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1730,9 +1730,9 @@ TEST(SM50_device_maximum_plus_ssrgemm_tt_t, 32x64x16_8x16x1_2x2_4x8_4x4) { using WarpShape = cutlass::gemm::GemmShape<8, 16, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1766,9 +1766,9 @@ TEST(SM50_device_maximum_plus_ssrgemm_tt_t, 32x128x16_8x32x1_2x4_4x8_4x4) { using WarpShape = cutlass::gemm::GemmShape<8, 32, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, 
precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1802,9 +1802,9 @@ TEST(SM50_device_maximum_plus_ssrgemm_tt_t, 64x32x16_16x8x1_2x2_8x4_4x4) { using WarpShape = cutlass::gemm::GemmShape<16, 8, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1838,9 +1838,9 @@ TEST(SM50_device_maximum_plus_ssrgemm_tt_t, 64x64x8_16x16x1_4x2_4x8_4x4) { using WarpShape = cutlass::gemm::GemmShape<16, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1874,9 +1874,9 @@ TEST(SM50_device_maximum_plus_ssrgemm_tt_t, 64x128x8_16x32x1_4x4_4x8_4x4) { using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using 
AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1910,9 +1910,9 @@ TEST(SM50_device_maximum_plus_ssrgemm_tt_t, 64x256x8_16x64x1_4x8_4x8_4x4) { using WarpShape = cutlass::gemm::GemmShape<16, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1946,9 +1946,9 @@ TEST(SM50_device_maximum_plus_ssrgemm_tt_t, 128x32x16_32x8x1_4x2_8x4_4x4) { using WarpShape = cutlass::gemm::GemmShape<32, 8, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1982,9 +1982,9 @@ TEST(SM50_device_maximum_plus_ssrgemm_tt_t, 128x64x8_32x16x1_4x4_8x4_4x4) { using WarpShape = cutlass::gemm::GemmShape<32, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -2018,9 
+2018,9 @@ TEST(SM50_device_maximum_plus_ssrgemm_tt_t, 128x128x8_32x32x1_8x4_4x8_4x4) { using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -2054,9 +2054,9 @@ TEST(SM50_device_maximum_plus_ssrgemm_tt_t, 256x64x8_64x16x1_8x4_8x4_4x4) { using WarpShape = cutlass::gemm::GemmShape<64, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::maximum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::maximum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; diff --git a/test/device/sm50_simt_minimum_maximum_dsrgemm_nn_n.cu b/test/device/sm50_simt_minimum_maximum_dsrgemm_nn_n.cu index decf223..89b5369 100644 --- a/test/device/sm50_simt_minimum_maximum_dsrgemm_nn_n.cu +++ b/test/device/sm50_simt_minimum_maximum_dsrgemm_nn_n.cu @@ -38,9 +38,9 @@ TEST(SM50_device_minimum_maximum_dsrgemm_nn_n, 8x32x8_8x32x1_2x4_4x8_1x1) { using WarpShape = cutlass::gemm::GemmShape<8, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename 
cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -74,9 +74,9 @@ TEST(SM50_device_minimum_maximum_dsrgemm_nn_n, 16x32x8_16x32x1_4x4_4x8_1x1) { using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -110,9 +110,9 @@ TEST(SM50_device_minimum_maximum_dsrgemm_nn_n, 16x64x8_16x64x1_4x8_4x8_1x1) { using WarpShape = cutlass::gemm::GemmShape<16, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -146,9 +146,9 @@ TEST(SM50_device_minimum_maximum_dsrgemm_nn_n, 32x32x8_32x32x1_8x4_4x8_1x1) { using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, 
precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -182,9 +182,9 @@ TEST(SM50_device_minimum_maximum_dsrgemm_nn_n, 8x32x8_8x16x1_2x2_4x8_1x2) { using WarpShape = cutlass::gemm::GemmShape<8, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -218,9 +218,9 @@ TEST(SM50_device_minimum_maximum_dsrgemm_nn_n, 8x64x8_8x32x1_2x4_4x8_1x2) { using WarpShape = cutlass::gemm::GemmShape<8, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -254,9 +254,9 @@ TEST(SM50_device_minimum_maximum_dsrgemm_nn_n, 16x32x8_16x16x1_4x2_4x8_1x2) { using WarpShape = cutlass::gemm::GemmShape<16, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, 
OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -290,9 +290,9 @@ TEST(SM50_device_minimum_maximum_dsrgemm_nn_n, 16x64x8_16x32x1_4x4_4x8_1x2) { using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -326,9 +326,9 @@ TEST(SM50_device_minimum_maximum_dsrgemm_nn_n, 16x128x8_16x64x1_4x8_4x8_1x2) { using WarpShape = cutlass::gemm::GemmShape<16, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -362,9 +362,9 @@ TEST(SM50_device_minimum_maximum_dsrgemm_nn_n, 32x32x8_32x16x1_4x4_8x4_1x2) { using WarpShape = cutlass::gemm::GemmShape<32, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = 
Config::MultiplicationOp; @@ -398,9 +398,9 @@ TEST(SM50_device_minimum_maximum_dsrgemm_nn_n, 32x64x8_32x32x1_8x4_4x8_1x2) { using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -434,9 +434,9 @@ TEST(SM50_device_minimum_maximum_dsrgemm_nn_n, 32x32x8_16x32x1_4x4_4x8_2x1) { using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -470,9 +470,9 @@ TEST(SM50_device_minimum_maximum_dsrgemm_nn_n, 64x32x8_32x32x1_8x4_4x8_2x1) { using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -506,9 +506,9 @@ 
TEST(SM50_device_minimum_maximum_dsrgemm_nn_n, 16x32x8_8x16x1_2x2_4x8_2x2) { using WarpShape = cutlass::gemm::GemmShape<8, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -542,9 +542,9 @@ TEST(SM50_device_minimum_maximum_dsrgemm_nn_n, 16x64x8_8x32x1_2x4_4x8_2x2) { using WarpShape = cutlass::gemm::GemmShape<8, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -578,9 +578,9 @@ TEST(SM50_device_minimum_maximum_dsrgemm_nn_n, 32x32x8_16x16x1_4x2_4x8_2x2) { using WarpShape = cutlass::gemm::GemmShape<16, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -614,9 +614,9 @@ TEST(SM50_device_minimum_maximum_dsrgemm_nn_n, 
32x64x8_16x32x1_4x4_4x8_2x2) { using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -650,9 +650,9 @@ TEST(SM50_device_minimum_maximum_dsrgemm_nn_n, 32x128x8_16x64x1_4x8_4x8_2x2) { using WarpShape = cutlass::gemm::GemmShape<16, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -686,9 +686,9 @@ TEST(SM50_device_minimum_maximum_dsrgemm_nn_n, 64x32x8_32x16x1_4x4_8x4_2x2) { using WarpShape = cutlass::gemm::GemmShape<32, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -722,9 +722,9 @@ TEST(SM50_device_minimum_maximum_dsrgemm_nn_n, 64x64x8_32x32x1_8x4_4x8_2x2) { using WarpShape = 
cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -758,9 +758,9 @@ TEST(SM50_device_minimum_maximum_dsrgemm_nn_n, 128x32x8_64x16x1_8x4_8x4_2x2) { using WarpShape = cutlass::gemm::GemmShape<64, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -794,9 +794,9 @@ TEST(SM50_device_minimum_maximum_dsrgemm_nn_n, 16x64x16_8x16x1_2x2_4x8_2x4) { using WarpShape = cutlass::gemm::GemmShape<8, 16, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -830,9 +830,9 @@ TEST(SM50_device_minimum_maximum_dsrgemm_nn_n, 16x128x16_8x32x1_2x4_4x8_2x4) { using WarpShape = cutlass::gemm::GemmShape<8, 32, 16>; using InstructionShape = 
cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -866,9 +866,9 @@ TEST(SM50_device_minimum_maximum_dsrgemm_nn_n, 32x32x8_16x8x1_2x2_8x4_2x4) { using WarpShape = cutlass::gemm::GemmShape<16, 8, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -902,9 +902,9 @@ TEST(SM50_device_minimum_maximum_dsrgemm_nn_n, 32x64x8_16x16x1_4x2_4x8_2x4) { using WarpShape = cutlass::gemm::GemmShape<16, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -938,9 +938,9 @@ TEST(SM50_device_minimum_maximum_dsrgemm_nn_n, 32x128x8_16x32x1_4x4_4x8_2x4) { using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename 
cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -974,9 +974,9 @@ TEST(SM50_device_minimum_maximum_dsrgemm_nn_n, 64x64x8_32x16x1_4x4_8x4_2x4) { using WarpShape = cutlass::gemm::GemmShape<32, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1010,9 +1010,9 @@ TEST(SM50_device_minimum_maximum_dsrgemm_nn_n, 32x32x8_8x16x1_2x2_4x8_4x2) { using WarpShape = cutlass::gemm::GemmShape<8, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1046,9 +1046,9 @@ TEST(SM50_device_minimum_maximum_dsrgemm_nn_n, 64x32x8_16x16x1_4x2_4x8_4x2) { using WarpShape = cutlass::gemm::GemmShape<16, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - 
precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1082,9 +1082,9 @@ TEST(SM50_device_minimum_maximum_dsrgemm_nn_n, 64x64x8_16x32x1_4x4_4x8_4x2) { using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1118,9 +1118,9 @@ TEST(SM50_device_minimum_maximum_dsrgemm_nn_n, 128x32x8_32x16x1_4x4_8x4_4x2) { using WarpShape = cutlass::gemm::GemmShape<32, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1154,9 +1154,9 @@ TEST(SM50_device_minimum_maximum_dsrgemm_nn_n, 32x64x16_8x16x1_2x2_4x8_4x4) { using WarpShape = cutlass::gemm::GemmShape<8, 16, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - 
cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1190,9 +1190,9 @@ TEST(SM50_device_minimum_maximum_dsrgemm_nn_n, 32x128x16_8x32x1_2x4_4x8_4x4) { using WarpShape = cutlass::gemm::GemmShape<8, 32, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1226,9 +1226,9 @@ TEST(SM50_device_minimum_maximum_dsrgemm_nn_n, 64x32x16_16x8x1_2x2_8x4_4x4) { using WarpShape = cutlass::gemm::GemmShape<16, 8, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1262,9 +1262,9 @@ TEST(SM50_device_minimum_maximum_dsrgemm_nn_n, 64x64x8_16x16x1_4x2_4x8_4x4) { using WarpShape = cutlass::gemm::GemmShape<16, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = 
typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1298,9 +1298,9 @@ TEST(SM50_device_minimum_maximum_dsrgemm_nn_n, 128x32x16_32x8x1_4x2_8x4_4x4) { using WarpShape = cutlass::gemm::GemmShape<32, 8, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; diff --git a/test/device/sm50_simt_minimum_maximum_dsrgemm_nn_t.cu b/test/device/sm50_simt_minimum_maximum_dsrgemm_nn_t.cu index fbd514f..e566ef7 100644 --- a/test/device/sm50_simt_minimum_maximum_dsrgemm_nn_t.cu +++ b/test/device/sm50_simt_minimum_maximum_dsrgemm_nn_t.cu @@ -38,9 +38,9 @@ TEST(SM50_device_minimum_maximum_dsrgemm_nn_t, 8x32x8_8x32x1_2x4_4x8_1x1) { using WarpShape = cutlass::gemm::GemmShape<8, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -74,9 +74,9 @@ TEST(SM50_device_minimum_maximum_dsrgemm_nn_t, 16x32x8_16x32x1_4x4_4x8_1x1) { using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 
1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -110,9 +110,9 @@ TEST(SM50_device_minimum_maximum_dsrgemm_nn_t, 16x64x8_16x64x1_4x8_4x8_1x1) { using WarpShape = cutlass::gemm::GemmShape<16, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -146,9 +146,9 @@ TEST(SM50_device_minimum_maximum_dsrgemm_nn_t, 32x32x8_32x32x1_8x4_4x8_1x1) { using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -182,9 +182,9 @@ TEST(SM50_device_minimum_maximum_dsrgemm_nn_t, 8x32x8_8x16x1_2x2_4x8_1x2) { using WarpShape = cutlass::gemm::GemmShape<8, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename 
cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -218,9 +218,9 @@ TEST(SM50_device_minimum_maximum_dsrgemm_nn_t, 8x64x8_8x32x1_2x4_4x8_1x2) { using WarpShape = cutlass::gemm::GemmShape<8, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -254,9 +254,9 @@ TEST(SM50_device_minimum_maximum_dsrgemm_nn_t, 16x32x8_16x16x1_4x2_4x8_1x2) { using WarpShape = cutlass::gemm::GemmShape<16, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -290,9 +290,9 @@ TEST(SM50_device_minimum_maximum_dsrgemm_nn_t, 16x64x8_16x32x1_4x4_4x8_1x2) { using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, 
precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -326,9 +326,9 @@ TEST(SM50_device_minimum_maximum_dsrgemm_nn_t, 16x128x8_16x64x1_4x8_4x8_1x2) { using WarpShape = cutlass::gemm::GemmShape<16, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -362,9 +362,9 @@ TEST(SM50_device_minimum_maximum_dsrgemm_nn_t, 32x32x8_32x16x1_4x4_8x4_1x2) { using WarpShape = cutlass::gemm::GemmShape<32, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -398,9 +398,9 @@ TEST(SM50_device_minimum_maximum_dsrgemm_nn_t, 32x64x8_32x32x1_8x4_4x8_1x2) { using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, 
cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -434,9 +434,9 @@ TEST(SM50_device_minimum_maximum_dsrgemm_nn_t, 32x32x8_16x32x1_4x4_4x8_2x1) { using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -470,9 +470,9 @@ TEST(SM50_device_minimum_maximum_dsrgemm_nn_t, 64x32x8_32x32x1_8x4_4x8_2x1) { using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -506,9 +506,9 @@ TEST(SM50_device_minimum_maximum_dsrgemm_nn_t, 16x32x8_8x16x1_2x2_4x8_2x2) { using WarpShape = cutlass::gemm::GemmShape<8, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename 
cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -542,9 +542,9 @@ TEST(SM50_device_minimum_maximum_dsrgemm_nn_t, 16x64x8_8x32x1_2x4_4x8_2x2) { using WarpShape = cutlass::gemm::GemmShape<8, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -578,9 +578,9 @@ TEST(SM50_device_minimum_maximum_dsrgemm_nn_t, 32x32x8_16x16x1_4x2_4x8_2x2) { using WarpShape = cutlass::gemm::GemmShape<16, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -614,9 +614,9 @@ TEST(SM50_device_minimum_maximum_dsrgemm_nn_t, 32x64x8_16x32x1_4x4_4x8_2x2) { using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, 
precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -650,9 +650,9 @@ TEST(SM50_device_minimum_maximum_dsrgemm_nn_t, 32x128x8_16x64x1_4x8_4x8_2x2) { using WarpShape = cutlass::gemm::GemmShape<16, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -686,9 +686,9 @@ TEST(SM50_device_minimum_maximum_dsrgemm_nn_t, 64x32x8_32x16x1_4x4_8x4_2x2) { using WarpShape = cutlass::gemm::GemmShape<32, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -722,9 +722,9 @@ TEST(SM50_device_minimum_maximum_dsrgemm_nn_t, 64x64x8_32x32x1_8x4_4x8_2x2) { using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, 
OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -758,9 +758,9 @@ TEST(SM50_device_minimum_maximum_dsrgemm_nn_t, 128x32x8_64x16x1_8x4_8x4_2x2) { using WarpShape = cutlass::gemm::GemmShape<64, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -794,9 +794,9 @@ TEST(SM50_device_minimum_maximum_dsrgemm_nn_t, 16x64x16_8x16x1_2x2_4x8_2x4) { using WarpShape = cutlass::gemm::GemmShape<8, 16, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -830,9 +830,9 @@ TEST(SM50_device_minimum_maximum_dsrgemm_nn_t, 16x128x16_8x32x1_2x4_4x8_2x4) { using WarpShape = cutlass::gemm::GemmShape<8, 32, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp 
= Config::MultiplicationOp; @@ -866,9 +866,9 @@ TEST(SM50_device_minimum_maximum_dsrgemm_nn_t, 32x32x8_16x8x1_2x2_8x4_2x4) { using WarpShape = cutlass::gemm::GemmShape<16, 8, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -902,9 +902,9 @@ TEST(SM50_device_minimum_maximum_dsrgemm_nn_t, 32x64x8_16x16x1_4x2_4x8_2x4) { using WarpShape = cutlass::gemm::GemmShape<16, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -938,9 +938,9 @@ TEST(SM50_device_minimum_maximum_dsrgemm_nn_t, 32x128x8_16x32x1_4x4_4x8_2x4) { using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -974,9 +974,9 @@ 
TEST(SM50_device_minimum_maximum_dsrgemm_nn_t, 64x64x8_32x16x1_4x4_8x4_2x4) { using WarpShape = cutlass::gemm::GemmShape<32, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1010,9 +1010,9 @@ TEST(SM50_device_minimum_maximum_dsrgemm_nn_t, 32x32x8_8x16x1_2x2_4x8_4x2) { using WarpShape = cutlass::gemm::GemmShape<8, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1046,9 +1046,9 @@ TEST(SM50_device_minimum_maximum_dsrgemm_nn_t, 64x32x8_16x16x1_4x2_4x8_4x2) { using WarpShape = cutlass::gemm::GemmShape<16, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1082,9 +1082,9 @@ TEST(SM50_device_minimum_maximum_dsrgemm_nn_t, 
64x64x8_16x32x1_4x4_4x8_4x2) { using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1118,9 +1118,9 @@ TEST(SM50_device_minimum_maximum_dsrgemm_nn_t, 128x32x8_32x16x1_4x4_8x4_4x2) { using WarpShape = cutlass::gemm::GemmShape<32, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1154,9 +1154,9 @@ TEST(SM50_device_minimum_maximum_dsrgemm_nn_t, 32x64x16_8x16x1_2x2_4x8_4x4) { using WarpShape = cutlass::gemm::GemmShape<8, 16, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1190,9 +1190,9 @@ TEST(SM50_device_minimum_maximum_dsrgemm_nn_t, 32x128x16_8x32x1_2x4_4x8_4x4) { using WarpShape = 
cutlass::gemm::GemmShape<8, 32, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1226,9 +1226,9 @@ TEST(SM50_device_minimum_maximum_dsrgemm_nn_t, 64x32x16_16x8x1_2x2_8x4_4x4) { using WarpShape = cutlass::gemm::GemmShape<16, 8, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1262,9 +1262,9 @@ TEST(SM50_device_minimum_maximum_dsrgemm_nn_t, 64x64x8_16x16x1_4x2_4x8_4x4) { using WarpShape = cutlass::gemm::GemmShape<16, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1298,9 +1298,9 @@ TEST(SM50_device_minimum_maximum_dsrgemm_nn_t, 128x32x16_32x8x1_4x2_8x4_4x4) { using WarpShape = cutlass::gemm::GemmShape<32, 8, 16>; using InstructionShape 
= cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; diff --git a/test/device/sm50_simt_minimum_maximum_dsrgemm_nt_n.cu b/test/device/sm50_simt_minimum_maximum_dsrgemm_nt_n.cu index ee22572..e63085e 100644 --- a/test/device/sm50_simt_minimum_maximum_dsrgemm_nt_n.cu +++ b/test/device/sm50_simt_minimum_maximum_dsrgemm_nt_n.cu @@ -38,9 +38,9 @@ TEST(SM50_device_minimum_maximum_dsrgemm_nt_n, 8x32x8_8x32x1_2x4_4x8_1x1) { using WarpShape = cutlass::gemm::GemmShape<8, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -74,9 +74,9 @@ TEST(SM50_device_minimum_maximum_dsrgemm_nt_n, 16x32x8_16x32x1_4x4_4x8_1x1) { using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = 
Config::MultiplicationOp; @@ -110,9 +110,9 @@ TEST(SM50_device_minimum_maximum_dsrgemm_nt_n, 16x64x8_16x64x1_4x8_4x8_1x1) { using WarpShape = cutlass::gemm::GemmShape<16, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -146,9 +146,9 @@ TEST(SM50_device_minimum_maximum_dsrgemm_nt_n, 32x32x8_32x32x1_8x4_4x8_1x1) { using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -182,9 +182,9 @@ TEST(SM50_device_minimum_maximum_dsrgemm_nt_n, 8x32x8_8x16x1_2x2_4x8_1x2) { using WarpShape = cutlass::gemm::GemmShape<8, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -218,9 +218,9 @@ 
TEST(SM50_device_minimum_maximum_dsrgemm_nt_n, 8x64x8_8x32x1_2x4_4x8_1x2) { using WarpShape = cutlass::gemm::GemmShape<8, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -254,9 +254,9 @@ TEST(SM50_device_minimum_maximum_dsrgemm_nt_n, 16x32x8_16x16x1_4x2_4x8_1x2) { using WarpShape = cutlass::gemm::GemmShape<16, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -290,9 +290,9 @@ TEST(SM50_device_minimum_maximum_dsrgemm_nt_n, 16x64x8_16x32x1_4x4_4x8_1x2) { using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -326,9 +326,9 @@ TEST(SM50_device_minimum_maximum_dsrgemm_nt_n, 
16x128x8_16x64x1_4x8_4x8_1x2) { using WarpShape = cutlass::gemm::GemmShape<16, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -362,9 +362,9 @@ TEST(SM50_device_minimum_maximum_dsrgemm_nt_n, 32x32x8_32x16x1_4x4_8x4_1x2) { using WarpShape = cutlass::gemm::GemmShape<32, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -398,9 +398,9 @@ TEST(SM50_device_minimum_maximum_dsrgemm_nt_n, 32x64x8_32x32x1_8x4_4x8_1x2) { using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -434,9 +434,9 @@ TEST(SM50_device_minimum_maximum_dsrgemm_nt_n, 32x32x8_16x32x1_4x4_4x8_2x1) { using WarpShape = 
cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -470,9 +470,9 @@ TEST(SM50_device_minimum_maximum_dsrgemm_nt_n, 64x32x8_32x32x1_8x4_4x8_2x1) { using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -506,9 +506,9 @@ TEST(SM50_device_minimum_maximum_dsrgemm_nt_n, 16x32x8_8x16x1_2x2_4x8_2x2) { using WarpShape = cutlass::gemm::GemmShape<8, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -542,9 +542,9 @@ TEST(SM50_device_minimum_maximum_dsrgemm_nt_n, 16x64x8_8x32x1_2x4_4x8_2x2) { using WarpShape = cutlass::gemm::GemmShape<8, 32, 8>; using InstructionShape = 
cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -578,9 +578,9 @@ TEST(SM50_device_minimum_maximum_dsrgemm_nt_n, 32x32x8_16x16x1_4x2_4x8_2x2) { using WarpShape = cutlass::gemm::GemmShape<16, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -614,9 +614,9 @@ TEST(SM50_device_minimum_maximum_dsrgemm_nt_n, 32x64x8_16x32x1_4x4_4x8_2x2) { using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -650,9 +650,9 @@ TEST(SM50_device_minimum_maximum_dsrgemm_nt_n, 32x128x8_16x64x1_4x8_4x8_2x2) { using WarpShape = cutlass::gemm::GemmShape<16, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename 
cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -686,9 +686,9 @@ TEST(SM50_device_minimum_maximum_dsrgemm_nt_n, 64x32x8_32x16x1_4x4_8x4_2x2) { using WarpShape = cutlass::gemm::GemmShape<32, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -722,9 +722,9 @@ TEST(SM50_device_minimum_maximum_dsrgemm_nt_n, 64x64x8_32x32x1_8x4_4x8_2x2) { using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -758,9 +758,9 @@ TEST(SM50_device_minimum_maximum_dsrgemm_nt_n, 128x32x8_64x16x1_8x4_8x4_2x2) { using WarpShape = cutlass::gemm::GemmShape<64, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, 
precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -794,9 +794,9 @@ TEST(SM50_device_minimum_maximum_dsrgemm_nt_n, 16x64x16_8x16x1_2x2_4x8_2x4) { using WarpShape = cutlass::gemm::GemmShape<8, 16, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -830,9 +830,9 @@ TEST(SM50_device_minimum_maximum_dsrgemm_nt_n, 16x128x16_8x32x1_2x4_4x8_2x4) { using WarpShape = cutlass::gemm::GemmShape<8, 32, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -866,9 +866,9 @@ TEST(SM50_device_minimum_maximum_dsrgemm_nt_n, 32x32x8_16x8x1_2x2_8x4_2x4) { using WarpShape = cutlass::gemm::GemmShape<16, 8, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, 
cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -902,9 +902,9 @@ TEST(SM50_device_minimum_maximum_dsrgemm_nt_n, 32x64x8_16x16x1_4x2_4x8_2x4) { using WarpShape = cutlass::gemm::GemmShape<16, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -938,9 +938,9 @@ TEST(SM50_device_minimum_maximum_dsrgemm_nt_n, 32x128x8_16x32x1_4x4_4x8_2x4) { using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -974,9 +974,9 @@ TEST(SM50_device_minimum_maximum_dsrgemm_nt_n, 64x64x8_32x16x1_4x4_8x4_2x4) { using WarpShape = cutlass::gemm::GemmShape<32, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename 
cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1010,9 +1010,9 @@ TEST(SM50_device_minimum_maximum_dsrgemm_nt_n, 32x32x8_8x16x1_2x2_4x8_4x2) { using WarpShape = cutlass::gemm::GemmShape<8, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1046,9 +1046,9 @@ TEST(SM50_device_minimum_maximum_dsrgemm_nt_n, 64x32x8_16x16x1_4x2_4x8_4x2) { using WarpShape = cutlass::gemm::GemmShape<16, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1082,9 +1082,9 @@ TEST(SM50_device_minimum_maximum_dsrgemm_nt_n, 64x64x8_16x32x1_4x4_4x8_4x2) { using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, 
precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1118,9 +1118,9 @@ TEST(SM50_device_minimum_maximum_dsrgemm_nt_n, 128x32x8_32x16x1_4x4_8x4_4x2) { using WarpShape = cutlass::gemm::GemmShape<32, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1154,9 +1154,9 @@ TEST(SM50_device_minimum_maximum_dsrgemm_nt_n, 32x64x16_8x16x1_2x2_4x8_4x4) { using WarpShape = cutlass::gemm::GemmShape<8, 16, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1190,9 +1190,9 @@ TEST(SM50_device_minimum_maximum_dsrgemm_nt_n, 32x128x16_8x32x1_2x4_4x8_4x4) { using WarpShape = cutlass::gemm::GemmShape<8, 32, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, 
cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1226,9 +1226,9 @@ TEST(SM50_device_minimum_maximum_dsrgemm_nt_n, 64x32x16_16x8x1_2x2_8x4_4x4) { using WarpShape = cutlass::gemm::GemmShape<16, 8, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1262,9 +1262,9 @@ TEST(SM50_device_minimum_maximum_dsrgemm_nt_n, 64x64x8_16x16x1_4x2_4x8_4x4) { using WarpShape = cutlass::gemm::GemmShape<16, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1298,9 +1298,9 @@ TEST(SM50_device_minimum_maximum_dsrgemm_nt_n, 128x32x16_32x8x1_4x2_8x4_4x4) { using WarpShape = cutlass::gemm::GemmShape<32, 8, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = 
Config::AdditionOp; using MultOp = Config::MultiplicationOp; diff --git a/test/device/sm50_simt_minimum_maximum_dsrgemm_nt_t.cu b/test/device/sm50_simt_minimum_maximum_dsrgemm_nt_t.cu index 786188f..9e18157 100644 --- a/test/device/sm50_simt_minimum_maximum_dsrgemm_nt_t.cu +++ b/test/device/sm50_simt_minimum_maximum_dsrgemm_nt_t.cu @@ -38,9 +38,9 @@ TEST(SM50_device_minimum_maximum_dsrgemm_nt_t, 8x32x8_8x32x1_2x4_4x8_1x1) { using WarpShape = cutlass::gemm::GemmShape<8, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -74,9 +74,9 @@ TEST(SM50_device_minimum_maximum_dsrgemm_nt_t, 16x32x8_16x32x1_4x4_4x8_1x1) { using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -110,9 +110,9 @@ TEST(SM50_device_minimum_maximum_dsrgemm_nt_t, 16x64x8_16x64x1_4x8_4x8_1x1) { using WarpShape = cutlass::gemm::GemmShape<16, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, 
SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -146,9 +146,9 @@ TEST(SM50_device_minimum_maximum_dsrgemm_nt_t, 32x32x8_32x32x1_8x4_4x8_1x1) { using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -182,9 +182,9 @@ TEST(SM50_device_minimum_maximum_dsrgemm_nt_t, 8x32x8_8x16x1_2x2_4x8_1x2) { using WarpShape = cutlass::gemm::GemmShape<8, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -218,9 +218,9 @@ TEST(SM50_device_minimum_maximum_dsrgemm_nt_t, 8x64x8_8x32x1_2x4_4x8_1x2) { using WarpShape = cutlass::gemm::GemmShape<8, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename 
cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -254,9 +254,9 @@ TEST(SM50_device_minimum_maximum_dsrgemm_nt_t, 16x32x8_16x16x1_4x2_4x8_1x2) { using WarpShape = cutlass::gemm::GemmShape<16, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -290,9 +290,9 @@ TEST(SM50_device_minimum_maximum_dsrgemm_nt_t, 16x64x8_16x32x1_4x4_4x8_1x2) { using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -326,9 +326,9 @@ TEST(SM50_device_minimum_maximum_dsrgemm_nt_t, 16x128x8_16x64x1_4x8_4x8_1x2) { using WarpShape = cutlass::gemm::GemmShape<16, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, 
precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -362,9 +362,9 @@ TEST(SM50_device_minimum_maximum_dsrgemm_nt_t, 32x32x8_32x16x1_4x4_8x4_1x2) { using WarpShape = cutlass::gemm::GemmShape<32, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -398,9 +398,9 @@ TEST(SM50_device_minimum_maximum_dsrgemm_nt_t, 32x64x8_32x32x1_8x4_4x8_1x2) { using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -434,9 +434,9 @@ TEST(SM50_device_minimum_maximum_dsrgemm_nt_t, 32x32x8_16x32x1_4x4_4x8_2x1) { using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, 
OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -470,9 +470,9 @@ TEST(SM50_device_minimum_maximum_dsrgemm_nt_t, 64x32x8_32x32x1_8x4_4x8_2x1) { using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -506,9 +506,9 @@ TEST(SM50_device_minimum_maximum_dsrgemm_nt_t, 16x32x8_8x16x1_2x2_4x8_2x2) { using WarpShape = cutlass::gemm::GemmShape<8, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -542,9 +542,9 @@ TEST(SM50_device_minimum_maximum_dsrgemm_nt_t, 16x64x8_8x32x1_2x4_4x8_2x2) { using WarpShape = cutlass::gemm::GemmShape<8, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = 
Config::MultiplicationOp; @@ -578,9 +578,9 @@ TEST(SM50_device_minimum_maximum_dsrgemm_nt_t, 32x32x8_16x16x1_4x2_4x8_2x2) { using WarpShape = cutlass::gemm::GemmShape<16, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -614,9 +614,9 @@ TEST(SM50_device_minimum_maximum_dsrgemm_nt_t, 32x64x8_16x32x1_4x4_4x8_2x2) { using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -650,9 +650,9 @@ TEST(SM50_device_minimum_maximum_dsrgemm_nt_t, 32x128x8_16x64x1_4x8_4x8_2x2) { using WarpShape = cutlass::gemm::GemmShape<16, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -686,9 +686,9 @@ 
TEST(SM50_device_minimum_maximum_dsrgemm_nt_t, 64x32x8_32x16x1_4x4_8x4_2x2) { using WarpShape = cutlass::gemm::GemmShape<32, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -722,9 +722,9 @@ TEST(SM50_device_minimum_maximum_dsrgemm_nt_t, 64x64x8_32x32x1_8x4_4x8_2x2) { using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -758,9 +758,9 @@ TEST(SM50_device_minimum_maximum_dsrgemm_nt_t, 128x32x8_64x16x1_8x4_8x4_2x2) { using WarpShape = cutlass::gemm::GemmShape<64, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -794,9 +794,9 @@ TEST(SM50_device_minimum_maximum_dsrgemm_nt_t, 
16x64x16_8x16x1_2x2_4x8_2x4) { using WarpShape = cutlass::gemm::GemmShape<8, 16, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -830,9 +830,9 @@ TEST(SM50_device_minimum_maximum_dsrgemm_nt_t, 16x128x16_8x32x1_2x4_4x8_2x4) { using WarpShape = cutlass::gemm::GemmShape<8, 32, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -866,9 +866,9 @@ TEST(SM50_device_minimum_maximum_dsrgemm_nt_t, 32x32x8_16x8x1_2x2_8x4_2x4) { using WarpShape = cutlass::gemm::GemmShape<16, 8, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -902,9 +902,9 @@ TEST(SM50_device_minimum_maximum_dsrgemm_nt_t, 32x64x8_16x16x1_4x2_4x8_2x4) { using WarpShape = 
cutlass::gemm::GemmShape<16, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -938,9 +938,9 @@ TEST(SM50_device_minimum_maximum_dsrgemm_nt_t, 32x128x8_16x32x1_4x4_4x8_2x4) { using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -974,9 +974,9 @@ TEST(SM50_device_minimum_maximum_dsrgemm_nt_t, 64x64x8_32x16x1_4x4_8x4_2x4) { using WarpShape = cutlass::gemm::GemmShape<32, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1010,9 +1010,9 @@ TEST(SM50_device_minimum_maximum_dsrgemm_nt_t, 32x32x8_8x16x1_2x2_4x8_4x2) { using WarpShape = cutlass::gemm::GemmShape<8, 16, 8>; using InstructionShape = 
cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1046,9 +1046,9 @@ TEST(SM50_device_minimum_maximum_dsrgemm_nt_t, 64x32x8_16x16x1_4x2_4x8_4x2) { using WarpShape = cutlass::gemm::GemmShape<16, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1082,9 +1082,9 @@ TEST(SM50_device_minimum_maximum_dsrgemm_nt_t, 64x64x8_16x32x1_4x4_4x8_4x2) { using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1118,9 +1118,9 @@ TEST(SM50_device_minimum_maximum_dsrgemm_nt_t, 128x32x8_32x16x1_4x4_8x4_4x2) { using WarpShape = cutlass::gemm::GemmShape<32, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename 
cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1154,9 +1154,9 @@ TEST(SM50_device_minimum_maximum_dsrgemm_nt_t, 32x64x16_8x16x1_2x2_4x8_4x4) { using WarpShape = cutlass::gemm::GemmShape<8, 16, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1190,9 +1190,9 @@ TEST(SM50_device_minimum_maximum_dsrgemm_nt_t, 32x128x16_8x32x1_2x4_4x8_4x4) { using WarpShape = cutlass::gemm::GemmShape<8, 32, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1226,9 +1226,9 @@ TEST(SM50_device_minimum_maximum_dsrgemm_nt_t, 64x32x16_16x8x1_2x2_8x4_4x4) { using WarpShape = cutlass::gemm::GemmShape<16, 8, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - 
precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1262,9 +1262,9 @@ TEST(SM50_device_minimum_maximum_dsrgemm_nt_t, 64x64x8_16x16x1_4x2_4x8_4x4) { using WarpShape = cutlass::gemm::GemmShape<16, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1298,9 +1298,9 @@ TEST(SM50_device_minimum_maximum_dsrgemm_nt_t, 128x32x16_32x8x1_4x2_8x4_4x4) { using WarpShape = cutlass::gemm::GemmShape<32, 8, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; diff --git a/test/device/sm50_simt_minimum_maximum_dsrgemm_tn_n.cu b/test/device/sm50_simt_minimum_maximum_dsrgemm_tn_n.cu index 4ae4217..50dda07 100644 --- a/test/device/sm50_simt_minimum_maximum_dsrgemm_tn_n.cu +++ b/test/device/sm50_simt_minimum_maximum_dsrgemm_tn_n.cu @@ -38,9 +38,9 @@ TEST(SM50_device_minimum_maximum_dsrgemm_tn_n, 
8x32x8_8x32x1_2x4_4x8_1x1) { using WarpShape = cutlass::gemm::GemmShape<8, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -74,9 +74,9 @@ TEST(SM50_device_minimum_maximum_dsrgemm_tn_n, 16x32x8_16x32x1_4x4_4x8_1x1) { using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -110,9 +110,9 @@ TEST(SM50_device_minimum_maximum_dsrgemm_tn_n, 16x64x8_16x64x1_4x8_4x8_1x1) { using WarpShape = cutlass::gemm::GemmShape<16, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -146,9 +146,9 @@ TEST(SM50_device_minimum_maximum_dsrgemm_tn_n, 32x32x8_32x32x1_8x4_4x8_1x1) { using WarpShape = 
cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -182,9 +182,9 @@ TEST(SM50_device_minimum_maximum_dsrgemm_tn_n, 8x32x8_8x16x1_2x2_4x8_1x2) { using WarpShape = cutlass::gemm::GemmShape<8, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -218,9 +218,9 @@ TEST(SM50_device_minimum_maximum_dsrgemm_tn_n, 8x64x8_8x32x1_2x4_4x8_1x2) { using WarpShape = cutlass::gemm::GemmShape<8, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -254,9 +254,9 @@ TEST(SM50_device_minimum_maximum_dsrgemm_tn_n, 16x32x8_16x16x1_4x2_4x8_1x2) { using WarpShape = cutlass::gemm::GemmShape<16, 16, 8>; using InstructionShape = 
cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -290,9 +290,9 @@ TEST(SM50_device_minimum_maximum_dsrgemm_tn_n, 16x64x8_16x32x1_4x4_4x8_1x2) { using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -326,9 +326,9 @@ TEST(SM50_device_minimum_maximum_dsrgemm_tn_n, 16x128x8_16x64x1_4x8_4x8_1x2) { using WarpShape = cutlass::gemm::GemmShape<16, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -362,9 +362,9 @@ TEST(SM50_device_minimum_maximum_dsrgemm_tn_n, 32x32x8_32x16x1_4x4_8x4_1x2) { using WarpShape = cutlass::gemm::GemmShape<32, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename 
cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -398,9 +398,9 @@ TEST(SM50_device_minimum_maximum_dsrgemm_tn_n, 32x64x8_32x32x1_8x4_4x8_1x2) { using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -434,9 +434,9 @@ TEST(SM50_device_minimum_maximum_dsrgemm_tn_n, 32x32x8_16x32x1_4x4_4x8_2x1) { using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -470,9 +470,9 @@ TEST(SM50_device_minimum_maximum_dsrgemm_tn_n, 64x32x8_32x32x1_8x4_4x8_2x1) { using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, 
precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -506,9 +506,9 @@ TEST(SM50_device_minimum_maximum_dsrgemm_tn_n, 16x32x8_8x16x1_2x2_4x8_2x2) { using WarpShape = cutlass::gemm::GemmShape<8, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -542,9 +542,9 @@ TEST(SM50_device_minimum_maximum_dsrgemm_tn_n, 16x64x8_8x32x1_2x4_4x8_2x2) { using WarpShape = cutlass::gemm::GemmShape<8, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -578,9 +578,9 @@ TEST(SM50_device_minimum_maximum_dsrgemm_tn_n, 32x32x8_16x16x1_4x2_4x8_2x2) { using WarpShape = cutlass::gemm::GemmShape<16, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, 
cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -614,9 +614,9 @@ TEST(SM50_device_minimum_maximum_dsrgemm_tn_n, 32x64x8_16x32x1_4x4_4x8_2x2) { using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -650,9 +650,9 @@ TEST(SM50_device_minimum_maximum_dsrgemm_tn_n, 32x128x8_16x64x1_4x8_4x8_2x2) { using WarpShape = cutlass::gemm::GemmShape<16, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -686,9 +686,9 @@ TEST(SM50_device_minimum_maximum_dsrgemm_tn_n, 64x32x8_32x16x1_4x4_8x4_2x2) { using WarpShape = cutlass::gemm::GemmShape<32, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename 
cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -722,9 +722,9 @@ TEST(SM50_device_minimum_maximum_dsrgemm_tn_n, 64x64x8_32x32x1_8x4_4x8_2x2) { using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -758,9 +758,9 @@ TEST(SM50_device_minimum_maximum_dsrgemm_tn_n, 128x32x8_64x16x1_8x4_8x4_2x2) { using WarpShape = cutlass::gemm::GemmShape<64, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -794,9 +794,9 @@ TEST(SM50_device_minimum_maximum_dsrgemm_tn_n, 16x64x16_8x16x1_2x2_4x8_2x4) { using WarpShape = cutlass::gemm::GemmShape<8, 16, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, 
precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -830,9 +830,9 @@ TEST(SM50_device_minimum_maximum_dsrgemm_tn_n, 16x128x16_8x32x1_2x4_4x8_2x4) { using WarpShape = cutlass::gemm::GemmShape<8, 32, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -866,9 +866,9 @@ TEST(SM50_device_minimum_maximum_dsrgemm_tn_n, 32x32x8_16x8x1_2x2_8x4_2x4) { using WarpShape = cutlass::gemm::GemmShape<16, 8, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -902,9 +902,9 @@ TEST(SM50_device_minimum_maximum_dsrgemm_tn_n, 32x64x8_16x16x1_4x2_4x8_2x4) { using WarpShape = cutlass::gemm::GemmShape<16, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, 
OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -938,9 +938,9 @@ TEST(SM50_device_minimum_maximum_dsrgemm_tn_n, 32x128x8_16x32x1_4x4_4x8_2x4) { using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -974,9 +974,9 @@ TEST(SM50_device_minimum_maximum_dsrgemm_tn_n, 64x64x8_32x16x1_4x4_8x4_2x4) { using WarpShape = cutlass::gemm::GemmShape<32, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1010,9 +1010,9 @@ TEST(SM50_device_minimum_maximum_dsrgemm_tn_n, 32x32x8_8x16x1_2x2_4x8_4x2) { using WarpShape = cutlass::gemm::GemmShape<8, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = 
Config::MultiplicationOp; @@ -1046,9 +1046,9 @@ TEST(SM50_device_minimum_maximum_dsrgemm_tn_n, 64x32x8_16x16x1_4x2_4x8_4x2) { using WarpShape = cutlass::gemm::GemmShape<16, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1082,9 +1082,9 @@ TEST(SM50_device_minimum_maximum_dsrgemm_tn_n, 64x64x8_16x32x1_4x4_4x8_4x2) { using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1118,9 +1118,9 @@ TEST(SM50_device_minimum_maximum_dsrgemm_tn_n, 128x32x8_32x16x1_4x4_8x4_4x2) { using WarpShape = cutlass::gemm::GemmShape<32, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1154,9 +1154,9 @@ 
TEST(SM50_device_minimum_maximum_dsrgemm_tn_n, 32x64x16_8x16x1_2x2_4x8_4x4) { using WarpShape = cutlass::gemm::GemmShape<8, 16, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1190,9 +1190,9 @@ TEST(SM50_device_minimum_maximum_dsrgemm_tn_n, 32x128x16_8x32x1_2x4_4x8_4x4) { using WarpShape = cutlass::gemm::GemmShape<8, 32, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1226,9 +1226,9 @@ TEST(SM50_device_minimum_maximum_dsrgemm_tn_n, 64x32x16_16x8x1_2x2_8x4_4x4) { using WarpShape = cutlass::gemm::GemmShape<16, 8, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1262,9 +1262,9 @@ TEST(SM50_device_minimum_maximum_dsrgemm_tn_n, 
64x64x8_16x16x1_4x2_4x8_4x4) { using WarpShape = cutlass::gemm::GemmShape<16, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1298,9 +1298,9 @@ TEST(SM50_device_minimum_maximum_dsrgemm_tn_n, 128x32x16_32x8x1_4x2_8x4_4x4) { using WarpShape = cutlass::gemm::GemmShape<32, 8, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; diff --git a/test/device/sm50_simt_minimum_maximum_dsrgemm_tn_t.cu b/test/device/sm50_simt_minimum_maximum_dsrgemm_tn_t.cu index 42aee49..cfc9508 100644 --- a/test/device/sm50_simt_minimum_maximum_dsrgemm_tn_t.cu +++ b/test/device/sm50_simt_minimum_maximum_dsrgemm_tn_t.cu @@ -38,9 +38,9 @@ TEST(SM50_device_minimum_maximum_dsrgemm_tn_t, 8x32x8_8x32x1_2x4_4x8_1x1) { using WarpShape = cutlass::gemm::GemmShape<8, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, 
precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -74,9 +74,9 @@ TEST(SM50_device_minimum_maximum_dsrgemm_tn_t, 16x32x8_16x32x1_4x4_4x8_1x1) { using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -110,9 +110,9 @@ TEST(SM50_device_minimum_maximum_dsrgemm_tn_t, 16x64x8_16x64x1_4x8_4x8_1x1) { using WarpShape = cutlass::gemm::GemmShape<16, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -146,9 +146,9 @@ TEST(SM50_device_minimum_maximum_dsrgemm_tn_t, 32x32x8_32x32x1_8x4_4x8_1x1) { using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using 
AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -182,9 +182,9 @@ TEST(SM50_device_minimum_maximum_dsrgemm_tn_t, 8x32x8_8x16x1_2x2_4x8_1x2) { using WarpShape = cutlass::gemm::GemmShape<8, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -218,9 +218,9 @@ TEST(SM50_device_minimum_maximum_dsrgemm_tn_t, 8x64x8_8x32x1_2x4_4x8_1x2) { using WarpShape = cutlass::gemm::GemmShape<8, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -254,9 +254,9 @@ TEST(SM50_device_minimum_maximum_dsrgemm_tn_t, 16x32x8_16x16x1_4x2_4x8_1x2) { using WarpShape = cutlass::gemm::GemmShape<16, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ 
-290,9 +290,9 @@ TEST(SM50_device_minimum_maximum_dsrgemm_tn_t, 16x64x8_16x32x1_4x4_4x8_1x2) { using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -326,9 +326,9 @@ TEST(SM50_device_minimum_maximum_dsrgemm_tn_t, 16x128x8_16x64x1_4x8_4x8_1x2) { using WarpShape = cutlass::gemm::GemmShape<16, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -362,9 +362,9 @@ TEST(SM50_device_minimum_maximum_dsrgemm_tn_t, 32x32x8_32x16x1_4x4_8x4_1x2) { using WarpShape = cutlass::gemm::GemmShape<32, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -398,9 +398,9 @@ TEST(SM50_device_minimum_maximum_dsrgemm_tn_t, 
32x64x8_32x32x1_8x4_4x8_1x2) { using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -434,9 +434,9 @@ TEST(SM50_device_minimum_maximum_dsrgemm_tn_t, 32x32x8_16x32x1_4x4_4x8_2x1) { using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -470,9 +470,9 @@ TEST(SM50_device_minimum_maximum_dsrgemm_tn_t, 64x32x8_32x32x1_8x4_4x8_2x1) { using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -506,9 +506,9 @@ TEST(SM50_device_minimum_maximum_dsrgemm_tn_t, 16x32x8_8x16x1_2x2_4x8_2x2) { using WarpShape = 
cutlass::gemm::GemmShape<8, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -542,9 +542,9 @@ TEST(SM50_device_minimum_maximum_dsrgemm_tn_t, 16x64x8_8x32x1_2x4_4x8_2x2) { using WarpShape = cutlass::gemm::GemmShape<8, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -578,9 +578,9 @@ TEST(SM50_device_minimum_maximum_dsrgemm_tn_t, 32x32x8_16x16x1_4x2_4x8_2x2) { using WarpShape = cutlass::gemm::GemmShape<16, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -614,9 +614,9 @@ TEST(SM50_device_minimum_maximum_dsrgemm_tn_t, 32x64x8_16x32x1_4x4_4x8_2x2) { using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = 
cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -650,9 +650,9 @@ TEST(SM50_device_minimum_maximum_dsrgemm_tn_t, 32x128x8_16x64x1_4x8_4x8_2x2) { using WarpShape = cutlass::gemm::GemmShape<16, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -686,9 +686,9 @@ TEST(SM50_device_minimum_maximum_dsrgemm_tn_t, 64x32x8_32x16x1_4x4_8x4_2x2) { using WarpShape = cutlass::gemm::GemmShape<32, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -722,9 +722,9 @@ TEST(SM50_device_minimum_maximum_dsrgemm_tn_t, 64x64x8_32x32x1_8x4_4x8_2x2) { using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename 
cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -758,9 +758,9 @@ TEST(SM50_device_minimum_maximum_dsrgemm_tn_t, 128x32x8_64x16x1_8x4_8x4_2x2) { using WarpShape = cutlass::gemm::GemmShape<64, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -794,9 +794,9 @@ TEST(SM50_device_minimum_maximum_dsrgemm_tn_t, 16x64x16_8x16x1_2x2_4x8_2x4) { using WarpShape = cutlass::gemm::GemmShape<8, 16, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -830,9 +830,9 @@ TEST(SM50_device_minimum_maximum_dsrgemm_tn_t, 16x128x16_8x32x1_2x4_4x8_2x4) { using WarpShape = cutlass::gemm::GemmShape<8, 32, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - 
precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -866,9 +866,9 @@ TEST(SM50_device_minimum_maximum_dsrgemm_tn_t, 32x32x8_16x8x1_2x2_8x4_2x4) { using WarpShape = cutlass::gemm::GemmShape<16, 8, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -902,9 +902,9 @@ TEST(SM50_device_minimum_maximum_dsrgemm_tn_t, 32x64x8_16x16x1_4x2_4x8_2x4) { using WarpShape = cutlass::gemm::GemmShape<16, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -938,9 +938,9 @@ TEST(SM50_device_minimum_maximum_dsrgemm_tn_t, 32x128x8_16x32x1_4x4_4x8_2x4) { using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - 
cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -974,9 +974,9 @@ TEST(SM50_device_minimum_maximum_dsrgemm_tn_t, 64x64x8_32x16x1_4x4_8x4_2x4) { using WarpShape = cutlass::gemm::GemmShape<32, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1010,9 +1010,9 @@ TEST(SM50_device_minimum_maximum_dsrgemm_tn_t, 32x32x8_8x16x1_2x2_4x8_4x2) { using WarpShape = cutlass::gemm::GemmShape<8, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1046,9 +1046,9 @@ TEST(SM50_device_minimum_maximum_dsrgemm_tn_t, 64x32x8_16x16x1_4x2_4x8_4x2) { using WarpShape = cutlass::gemm::GemmShape<16, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = 
typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1082,9 +1082,9 @@ TEST(SM50_device_minimum_maximum_dsrgemm_tn_t, 64x64x8_16x32x1_4x4_4x8_4x2) { using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1118,9 +1118,9 @@ TEST(SM50_device_minimum_maximum_dsrgemm_tn_t, 128x32x8_32x16x1_4x4_8x4_4x2) { using WarpShape = cutlass::gemm::GemmShape<32, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1154,9 +1154,9 @@ TEST(SM50_device_minimum_maximum_dsrgemm_tn_t, 32x64x16_8x16x1_2x2_4x8_4x4) { using WarpShape = cutlass::gemm::GemmShape<8, 16, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< 
+ precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1190,9 +1190,9 @@ TEST(SM50_device_minimum_maximum_dsrgemm_tn_t, 32x128x16_8x32x1_2x4_4x8_4x4) { using WarpShape = cutlass::gemm::GemmShape<8, 32, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1226,9 +1226,9 @@ TEST(SM50_device_minimum_maximum_dsrgemm_tn_t, 64x32x16_16x8x1_2x2_8x4_4x4) { using WarpShape = cutlass::gemm::GemmShape<16, 8, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1262,9 +1262,9 @@ TEST(SM50_device_minimum_maximum_dsrgemm_tn_t, 64x64x8_16x16x1_4x2_4x8_4x4) { using WarpShape = cutlass::gemm::GemmShape<16, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + 
cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1298,9 +1298,9 @@ TEST(SM50_device_minimum_maximum_dsrgemm_tn_t, 128x32x16_32x8x1_4x2_8x4_4x4) { using WarpShape = cutlass::gemm::GemmShape<32, 8, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; diff --git a/test/device/sm50_simt_minimum_maximum_dsrgemm_tt_n.cu b/test/device/sm50_simt_minimum_maximum_dsrgemm_tt_n.cu index e5c9a0f..4ada046 100644 --- a/test/device/sm50_simt_minimum_maximum_dsrgemm_tt_n.cu +++ b/test/device/sm50_simt_minimum_maximum_dsrgemm_tt_n.cu @@ -38,9 +38,9 @@ TEST(SM50_device_minimum_maximum_dsrgemm_tt_n, 8x32x8_8x32x1_2x4_4x8_1x1) { using WarpShape = cutlass::gemm::GemmShape<8, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -74,9 +74,9 @@ TEST(SM50_device_minimum_maximum_dsrgemm_tt_n, 16x32x8_16x32x1_4x4_4x8_1x1) { using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, 
precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -110,9 +110,9 @@ TEST(SM50_device_minimum_maximum_dsrgemm_tt_n, 16x64x8_16x64x1_4x8_4x8_1x1) { using WarpShape = cutlass::gemm::GemmShape<16, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -146,9 +146,9 @@ TEST(SM50_device_minimum_maximum_dsrgemm_tt_n, 32x32x8_32x32x1_8x4_4x8_1x1) { using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -182,9 +182,9 @@ TEST(SM50_device_minimum_maximum_dsrgemm_tt_n, 8x32x8_8x16x1_2x2_4x8_1x2) { using WarpShape = cutlass::gemm::GemmShape<8, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, 
SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -218,9 +218,9 @@ TEST(SM50_device_minimum_maximum_dsrgemm_tt_n, 8x64x8_8x32x1_2x4_4x8_1x2) { using WarpShape = cutlass::gemm::GemmShape<8, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -254,9 +254,9 @@ TEST(SM50_device_minimum_maximum_dsrgemm_tt_n, 16x32x8_16x16x1_4x2_4x8_1x2) { using WarpShape = cutlass::gemm::GemmShape<16, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -290,9 +290,9 @@ TEST(SM50_device_minimum_maximum_dsrgemm_tt_n, 16x64x8_16x32x1_4x4_4x8_1x2) { using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename 
cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -326,9 +326,9 @@ TEST(SM50_device_minimum_maximum_dsrgemm_tt_n, 16x128x8_16x64x1_4x8_4x8_1x2) { using WarpShape = cutlass::gemm::GemmShape<16, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -362,9 +362,9 @@ TEST(SM50_device_minimum_maximum_dsrgemm_tt_n, 32x32x8_32x16x1_4x4_8x4_1x2) { using WarpShape = cutlass::gemm::GemmShape<32, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -398,9 +398,9 @@ TEST(SM50_device_minimum_maximum_dsrgemm_tt_n, 32x64x8_32x32x1_8x4_4x8_1x2) { using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, 
precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -434,9 +434,9 @@ TEST(SM50_device_minimum_maximum_dsrgemm_tt_n, 32x32x8_16x32x1_4x4_4x8_2x1) { using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -470,9 +470,9 @@ TEST(SM50_device_minimum_maximum_dsrgemm_tt_n, 64x32x8_32x32x1_8x4_4x8_2x1) { using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -506,9 +506,9 @@ TEST(SM50_device_minimum_maximum_dsrgemm_tt_n, 16x32x8_8x16x1_2x2_4x8_2x2) { using WarpShape = cutlass::gemm::GemmShape<8, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, 
OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -542,9 +542,9 @@ TEST(SM50_device_minimum_maximum_dsrgemm_tt_n, 16x64x8_8x32x1_2x4_4x8_2x2) { using WarpShape = cutlass::gemm::GemmShape<8, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -578,9 +578,9 @@ TEST(SM50_device_minimum_maximum_dsrgemm_tt_n, 32x32x8_16x16x1_4x2_4x8_2x2) { using WarpShape = cutlass::gemm::GemmShape<16, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -614,9 +614,9 @@ TEST(SM50_device_minimum_maximum_dsrgemm_tt_n, 32x64x8_16x32x1_4x4_4x8_2x2) { using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = 
Config::MultiplicationOp; @@ -650,9 +650,9 @@ TEST(SM50_device_minimum_maximum_dsrgemm_tt_n, 32x128x8_16x64x1_4x8_4x8_2x2) { using WarpShape = cutlass::gemm::GemmShape<16, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -686,9 +686,9 @@ TEST(SM50_device_minimum_maximum_dsrgemm_tt_n, 64x32x8_32x16x1_4x4_8x4_2x2) { using WarpShape = cutlass::gemm::GemmShape<32, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -722,9 +722,9 @@ TEST(SM50_device_minimum_maximum_dsrgemm_tt_n, 64x64x8_32x32x1_8x4_4x8_2x2) { using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -758,9 +758,9 @@ 
TEST(SM50_device_minimum_maximum_dsrgemm_tt_n, 128x32x8_64x16x1_8x4_8x4_2x2) { using WarpShape = cutlass::gemm::GemmShape<64, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -794,9 +794,9 @@ TEST(SM50_device_minimum_maximum_dsrgemm_tt_n, 16x64x16_8x16x1_2x2_4x8_2x4) { using WarpShape = cutlass::gemm::GemmShape<8, 16, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -830,9 +830,9 @@ TEST(SM50_device_minimum_maximum_dsrgemm_tt_n, 16x128x16_8x32x1_2x4_4x8_2x4) { using WarpShape = cutlass::gemm::GemmShape<8, 32, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -866,9 +866,9 @@ TEST(SM50_device_minimum_maximum_dsrgemm_tt_n, 
32x32x8_16x8x1_2x2_8x4_2x4) { using WarpShape = cutlass::gemm::GemmShape<16, 8, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -902,9 +902,9 @@ TEST(SM50_device_minimum_maximum_dsrgemm_tt_n, 32x64x8_16x16x1_4x2_4x8_2x4) { using WarpShape = cutlass::gemm::GemmShape<16, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -938,9 +938,9 @@ TEST(SM50_device_minimum_maximum_dsrgemm_tt_n, 32x128x8_16x32x1_4x4_4x8_2x4) { using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -974,9 +974,9 @@ TEST(SM50_device_minimum_maximum_dsrgemm_tt_n, 64x64x8_32x16x1_4x4_8x4_2x4) { using WarpShape = 
cutlass::gemm::GemmShape<32, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1010,9 +1010,9 @@ TEST(SM50_device_minimum_maximum_dsrgemm_tt_n, 32x32x8_8x16x1_2x2_4x8_4x2) { using WarpShape = cutlass::gemm::GemmShape<8, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1046,9 +1046,9 @@ TEST(SM50_device_minimum_maximum_dsrgemm_tt_n, 64x32x8_16x16x1_4x2_4x8_4x2) { using WarpShape = cutlass::gemm::GemmShape<16, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1082,9 +1082,9 @@ TEST(SM50_device_minimum_maximum_dsrgemm_tt_n, 64x64x8_16x32x1_4x4_4x8_4x2) { using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = 
cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1118,9 +1118,9 @@ TEST(SM50_device_minimum_maximum_dsrgemm_tt_n, 128x32x8_32x16x1_4x4_8x4_4x2) { using WarpShape = cutlass::gemm::GemmShape<32, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1154,9 +1154,9 @@ TEST(SM50_device_minimum_maximum_dsrgemm_tt_n, 32x64x16_8x16x1_2x2_4x8_4x4) { using WarpShape = cutlass::gemm::GemmShape<8, 16, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1190,9 +1190,9 @@ TEST(SM50_device_minimum_maximum_dsrgemm_tt_n, 32x128x16_8x32x1_2x4_4x8_4x4) { using WarpShape = cutlass::gemm::GemmShape<8, 32, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = 
typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1226,9 +1226,9 @@ TEST(SM50_device_minimum_maximum_dsrgemm_tt_n, 64x32x16_16x8x1_2x2_8x4_4x4) { using WarpShape = cutlass::gemm::GemmShape<16, 8, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1262,9 +1262,9 @@ TEST(SM50_device_minimum_maximum_dsrgemm_tt_n, 64x64x8_16x16x1_4x2_4x8_4x4) { using WarpShape = cutlass::gemm::GemmShape<16, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1298,9 +1298,9 @@ TEST(SM50_device_minimum_maximum_dsrgemm_tt_n, 128x32x16_32x8x1_4x2_8x4_4x4) { using WarpShape = cutlass::gemm::GemmShape<32, 8, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< 
// - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; diff --git a/test/device/sm50_simt_minimum_maximum_dsrgemm_tt_t.cu b/test/device/sm50_simt_minimum_maximum_dsrgemm_tt_t.cu index 3765f4b..8df92ab 100644 --- a/test/device/sm50_simt_minimum_maximum_dsrgemm_tt_t.cu +++ b/test/device/sm50_simt_minimum_maximum_dsrgemm_tt_t.cu @@ -38,9 +38,9 @@ TEST(SM50_device_minimum_maximum_dsrgemm_tt_t, 8x32x8_8x32x1_2x4_4x8_1x1) { using WarpShape = cutlass::gemm::GemmShape<8, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -74,9 +74,9 @@ TEST(SM50_device_minimum_maximum_dsrgemm_tt_t, 16x32x8_16x32x1_4x4_4x8_1x1) { using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -110,9 +110,9 @@ TEST(SM50_device_minimum_maximum_dsrgemm_tt_t, 
16x64x8_16x64x1_4x8_4x8_1x1) { using WarpShape = cutlass::gemm::GemmShape<16, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -146,9 +146,9 @@ TEST(SM50_device_minimum_maximum_dsrgemm_tt_t, 32x32x8_32x32x1_8x4_4x8_1x1) { using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -182,9 +182,9 @@ TEST(SM50_device_minimum_maximum_dsrgemm_tt_t, 8x32x8_8x16x1_2x2_4x8_1x2) { using WarpShape = cutlass::gemm::GemmShape<8, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -218,9 +218,9 @@ TEST(SM50_device_minimum_maximum_dsrgemm_tt_t, 8x64x8_8x32x1_2x4_4x8_1x2) { using WarpShape = 
cutlass::gemm::GemmShape<8, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -254,9 +254,9 @@ TEST(SM50_device_minimum_maximum_dsrgemm_tt_t, 16x32x8_16x16x1_4x2_4x8_1x2) { using WarpShape = cutlass::gemm::GemmShape<16, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -290,9 +290,9 @@ TEST(SM50_device_minimum_maximum_dsrgemm_tt_t, 16x64x8_16x32x1_4x4_4x8_1x2) { using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -326,9 +326,9 @@ TEST(SM50_device_minimum_maximum_dsrgemm_tt_t, 16x128x8_16x64x1_4x8_4x8_1x2) { using WarpShape = cutlass::gemm::GemmShape<16, 64, 8>; using InstructionShape = 
cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -362,9 +362,9 @@ TEST(SM50_device_minimum_maximum_dsrgemm_tt_t, 32x32x8_32x16x1_4x4_8x4_1x2) { using WarpShape = cutlass::gemm::GemmShape<32, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -398,9 +398,9 @@ TEST(SM50_device_minimum_maximum_dsrgemm_tt_t, 32x64x8_32x32x1_8x4_4x8_1x2) { using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -434,9 +434,9 @@ TEST(SM50_device_minimum_maximum_dsrgemm_tt_t, 32x32x8_16x32x1_4x4_4x8_2x1) { using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename 
cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -470,9 +470,9 @@ TEST(SM50_device_minimum_maximum_dsrgemm_tt_t, 64x32x8_32x32x1_8x4_4x8_2x1) { using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -506,9 +506,9 @@ TEST(SM50_device_minimum_maximum_dsrgemm_tt_t, 16x32x8_8x16x1_2x2_4x8_2x2) { using WarpShape = cutlass::gemm::GemmShape<8, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -542,9 +542,9 @@ TEST(SM50_device_minimum_maximum_dsrgemm_tt_t, 16x64x8_8x32x1_2x4_4x8_2x2) { using WarpShape = cutlass::gemm::GemmShape<8, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, 
precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -578,9 +578,9 @@ TEST(SM50_device_minimum_maximum_dsrgemm_tt_t, 32x32x8_16x16x1_4x2_4x8_2x2) { using WarpShape = cutlass::gemm::GemmShape<16, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -614,9 +614,9 @@ TEST(SM50_device_minimum_maximum_dsrgemm_tt_t, 32x64x8_16x32x1_4x4_4x8_2x2) { using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -650,9 +650,9 @@ TEST(SM50_device_minimum_maximum_dsrgemm_tt_t, 32x128x8_16x64x1_4x8_4x8_2x2) { using WarpShape = cutlass::gemm::GemmShape<16, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, 
cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -686,9 +686,9 @@ TEST(SM50_device_minimum_maximum_dsrgemm_tt_t, 64x32x8_32x16x1_4x4_8x4_2x2) { using WarpShape = cutlass::gemm::GemmShape<32, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -722,9 +722,9 @@ TEST(SM50_device_minimum_maximum_dsrgemm_tt_t, 64x64x8_32x32x1_8x4_4x8_2x2) { using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -758,9 +758,9 @@ TEST(SM50_device_minimum_maximum_dsrgemm_tt_t, 128x32x8_64x16x1_8x4_8x4_2x2) { using WarpShape = cutlass::gemm::GemmShape<64, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename 
cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -794,9 +794,9 @@ TEST(SM50_device_minimum_maximum_dsrgemm_tt_t, 16x64x16_8x16x1_2x2_4x8_2x4) { using WarpShape = cutlass::gemm::GemmShape<8, 16, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -830,9 +830,9 @@ TEST(SM50_device_minimum_maximum_dsrgemm_tt_t, 16x128x16_8x32x1_2x4_4x8_2x4) { using WarpShape = cutlass::gemm::GemmShape<8, 32, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -866,9 +866,9 @@ TEST(SM50_device_minimum_maximum_dsrgemm_tt_t, 32x32x8_16x8x1_2x2_8x4_2x4) { using WarpShape = cutlass::gemm::GemmShape<16, 8, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, 
precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -902,9 +902,9 @@ TEST(SM50_device_minimum_maximum_dsrgemm_tt_t, 32x64x8_16x16x1_4x2_4x8_2x4) { using WarpShape = cutlass::gemm::GemmShape<16, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -938,9 +938,9 @@ TEST(SM50_device_minimum_maximum_dsrgemm_tt_t, 32x128x8_16x32x1_4x4_4x8_2x4) { using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -974,9 +974,9 @@ TEST(SM50_device_minimum_maximum_dsrgemm_tt_t, 64x64x8_32x16x1_4x4_8x4_2x4) { using WarpShape = cutlass::gemm::GemmShape<32, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, 
OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1010,9 +1010,9 @@ TEST(SM50_device_minimum_maximum_dsrgemm_tt_t, 32x32x8_8x16x1_2x2_4x8_4x2) { using WarpShape = cutlass::gemm::GemmShape<8, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1046,9 +1046,9 @@ TEST(SM50_device_minimum_maximum_dsrgemm_tt_t, 64x32x8_16x16x1_4x2_4x8_4x2) { using WarpShape = cutlass::gemm::GemmShape<16, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1082,9 +1082,9 @@ TEST(SM50_device_minimum_maximum_dsrgemm_tt_t, 64x64x8_16x32x1_4x4_4x8_4x2) { using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using 
MultOp = Config::MultiplicationOp; @@ -1118,9 +1118,9 @@ TEST(SM50_device_minimum_maximum_dsrgemm_tt_t, 128x32x8_32x16x1_4x4_8x4_4x2) { using WarpShape = cutlass::gemm::GemmShape<32, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1154,9 +1154,9 @@ TEST(SM50_device_minimum_maximum_dsrgemm_tt_t, 32x64x16_8x16x1_2x2_4x8_4x4) { using WarpShape = cutlass::gemm::GemmShape<8, 16, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1190,9 +1190,9 @@ TEST(SM50_device_minimum_maximum_dsrgemm_tt_t, 32x128x16_8x32x1_2x4_4x8_4x4) { using WarpShape = cutlass::gemm::GemmShape<8, 32, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1226,9 +1226,9 @@ 
TEST(SM50_device_minimum_maximum_dsrgemm_tt_t, 64x32x16_16x8x1_2x2_8x4_4x4) { using WarpShape = cutlass::gemm::GemmShape<16, 8, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1262,9 +1262,9 @@ TEST(SM50_device_minimum_maximum_dsrgemm_tt_t, 64x64x8_16x16x1_4x2_4x8_4x4) { using WarpShape = cutlass::gemm::GemmShape<16, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1298,9 +1298,9 @@ TEST(SM50_device_minimum_maximum_dsrgemm_tt_t, 128x32x16_32x8x1_4x2_8x4_4x4) { using WarpShape = cutlass::gemm::GemmShape<32, 8, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; diff --git a/test/device/sm50_simt_minimum_maximum_ssrgemm_nn_n.cu 
b/test/device/sm50_simt_minimum_maximum_ssrgemm_nn_n.cu index e283b64..5fefb79 100644 --- a/test/device/sm50_simt_minimum_maximum_ssrgemm_nn_n.cu +++ b/test/device/sm50_simt_minimum_maximum_ssrgemm_nn_n.cu @@ -38,9 +38,9 @@ TEST(SM50_device_minimum_maximum_ssrgemm_nn_n, 8x32x8_8x32x1_2x4_4x8_1x1) { using WarpShape = cutlass::gemm::GemmShape<8, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -74,9 +74,9 @@ TEST(SM50_device_minimum_maximum_ssrgemm_nn_n, 16x32x8_16x32x1_4x4_4x8_1x1) { using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -110,9 +110,9 @@ TEST(SM50_device_minimum_maximum_ssrgemm_nn_n, 16x64x8_16x64x1_4x8_4x8_1x1) { using WarpShape = cutlass::gemm::GemmShape<16, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, 
precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -146,9 +146,9 @@ TEST(SM50_device_minimum_maximum_ssrgemm_nn_n, 32x32x8_32x32x1_8x4_4x8_1x1) { using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -182,9 +182,9 @@ TEST(SM50_device_minimum_maximum_ssrgemm_nn_n, 32x64x8_32x64x1_8x8_4x8_1x1) { using WarpShape = cutlass::gemm::GemmShape<32, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -218,9 +218,9 @@ TEST(SM50_device_minimum_maximum_ssrgemm_nn_n, 64x32x8_64x32x1_8x8_8x4_1x1) { using WarpShape = cutlass::gemm::GemmShape<64, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; 
using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -254,9 +254,9 @@ TEST(SM50_device_minimum_maximum_ssrgemm_nn_n, 8x32x8_8x16x1_2x2_4x8_1x2) { using WarpShape = cutlass::gemm::GemmShape<8, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -290,9 +290,9 @@ TEST(SM50_device_minimum_maximum_ssrgemm_nn_n, 8x64x8_8x32x1_2x4_4x8_1x2) { using WarpShape = cutlass::gemm::GemmShape<8, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -326,9 +326,9 @@ TEST(SM50_device_minimum_maximum_ssrgemm_nn_n, 16x32x8_16x16x1_4x2_4x8_1x2) { using WarpShape = cutlass::gemm::GemmShape<16, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = 
Config::MultiplicationOp; @@ -362,9 +362,9 @@ TEST(SM50_device_minimum_maximum_ssrgemm_nn_n, 16x64x8_16x32x1_4x4_4x8_1x2) { using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -398,9 +398,9 @@ TEST(SM50_device_minimum_maximum_ssrgemm_nn_n, 16x128x8_16x64x1_4x8_4x8_1x2) { using WarpShape = cutlass::gemm::GemmShape<16, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -434,9 +434,9 @@ TEST(SM50_device_minimum_maximum_ssrgemm_nn_n, 32x32x8_32x16x1_4x4_8x4_1x2) { using WarpShape = cutlass::gemm::GemmShape<32, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -470,9 +470,9 @@ 
TEST(SM50_device_minimum_maximum_ssrgemm_nn_n, 32x64x8_32x32x1_8x4_4x8_1x2) { using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -506,9 +506,9 @@ TEST(SM50_device_minimum_maximum_ssrgemm_nn_n, 32x128x8_32x64x1_8x8_4x8_1x2) { using WarpShape = cutlass::gemm::GemmShape<32, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -542,9 +542,9 @@ TEST(SM50_device_minimum_maximum_ssrgemm_nn_n, 64x64x8_64x32x1_8x8_8x4_1x2) { using WarpShape = cutlass::gemm::GemmShape<64, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -578,9 +578,9 @@ TEST(SM50_device_minimum_maximum_ssrgemm_nn_n, 
32x32x8_16x32x1_4x4_4x8_2x1) { using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -614,9 +614,9 @@ TEST(SM50_device_minimum_maximum_ssrgemm_nn_n, 64x32x8_32x32x1_8x4_4x8_2x1) { using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -650,9 +650,9 @@ TEST(SM50_device_minimum_maximum_ssrgemm_nn_n, 64x64x8_32x64x1_8x8_4x8_2x1) { using WarpShape = cutlass::gemm::GemmShape<32, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -686,9 +686,9 @@ TEST(SM50_device_minimum_maximum_ssrgemm_nn_n, 128x32x8_64x32x1_8x8_8x4_2x1) { using WarpShape = 
cutlass::gemm::GemmShape<64, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -722,9 +722,9 @@ TEST(SM50_device_minimum_maximum_ssrgemm_nn_n, 16x32x8_8x16x1_2x2_4x8_2x2) { using WarpShape = cutlass::gemm::GemmShape<8, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -758,9 +758,9 @@ TEST(SM50_device_minimum_maximum_ssrgemm_nn_n, 16x64x8_8x32x1_2x4_4x8_2x2) { using WarpShape = cutlass::gemm::GemmShape<8, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -794,9 +794,9 @@ TEST(SM50_device_minimum_maximum_ssrgemm_nn_n, 32x32x8_16x16x1_4x2_4x8_2x2) { using WarpShape = cutlass::gemm::GemmShape<16, 16, 8>; using InstructionShape = 
cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -830,9 +830,9 @@ TEST(SM50_device_minimum_maximum_ssrgemm_nn_n, 32x64x8_16x32x1_4x4_4x8_2x2) { using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -866,9 +866,9 @@ TEST(SM50_device_minimum_maximum_ssrgemm_nn_n, 32x128x8_16x64x1_4x8_4x8_2x2) { using WarpShape = cutlass::gemm::GemmShape<16, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -902,9 +902,9 @@ TEST(SM50_device_minimum_maximum_ssrgemm_nn_n, 64x32x8_32x16x1_4x4_8x4_2x2) { using WarpShape = cutlass::gemm::GemmShape<32, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename 
cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -938,9 +938,9 @@ TEST(SM50_device_minimum_maximum_ssrgemm_nn_n, 64x64x8_32x32x1_8x4_4x8_2x2) { using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -974,9 +974,9 @@ TEST(SM50_device_minimum_maximum_ssrgemm_nn_n, 64x128x8_32x64x1_8x8_4x8_2x2) { using WarpShape = cutlass::gemm::GemmShape<32, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1010,9 +1010,9 @@ TEST(SM50_device_minimum_maximum_ssrgemm_nn_n, 128x32x8_64x16x1_8x4_8x4_2x2) { using WarpShape = cutlass::gemm::GemmShape<64, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - 
precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1046,9 +1046,9 @@ TEST(SM50_device_minimum_maximum_ssrgemm_nn_n, 128x64x8_64x32x1_8x8_8x4_2x2) { using WarpShape = cutlass::gemm::GemmShape<64, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1082,9 +1082,9 @@ TEST(SM50_device_minimum_maximum_ssrgemm_nn_n, 16x64x16_8x16x1_2x2_4x8_2x4) { using WarpShape = cutlass::gemm::GemmShape<8, 16, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1118,9 +1118,9 @@ TEST(SM50_device_minimum_maximum_ssrgemm_nn_n, 16x128x16_8x32x1_2x4_4x8_2x4) { using WarpShape = cutlass::gemm::GemmShape<8, 32, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - 
cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1154,9 +1154,9 @@ TEST(SM50_device_minimum_maximum_ssrgemm_nn_n, 32x32x8_16x8x1_2x2_8x4_2x4) { using WarpShape = cutlass::gemm::GemmShape<16, 8, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1190,9 +1190,9 @@ TEST(SM50_device_minimum_maximum_ssrgemm_nn_n, 32x64x8_16x16x1_4x2_4x8_2x4) { using WarpShape = cutlass::gemm::GemmShape<16, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1226,9 +1226,9 @@ TEST(SM50_device_minimum_maximum_ssrgemm_nn_n, 32x128x8_16x32x1_4x4_4x8_2x4) { using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = 
typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1262,9 +1262,9 @@ TEST(SM50_device_minimum_maximum_ssrgemm_nn_n, 32x256x8_16x64x1_4x8_4x8_2x4) { using WarpShape = cutlass::gemm::GemmShape<16, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1298,9 +1298,9 @@ TEST(SM50_device_minimum_maximum_ssrgemm_nn_n, 64x64x8_32x16x1_4x4_8x4_2x4) { using WarpShape = cutlass::gemm::GemmShape<32, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1334,9 +1334,9 @@ TEST(SM50_device_minimum_maximum_ssrgemm_nn_n, 64x128x8_32x32x1_8x4_4x8_2x4) { using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< 
+ precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1370,9 +1370,9 @@ TEST(SM50_device_minimum_maximum_ssrgemm_nn_n, 64x256x8_32x64x1_8x8_4x8_2x4) { using WarpShape = cutlass::gemm::GemmShape<32, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1406,9 +1406,9 @@ TEST(SM50_device_minimum_maximum_ssrgemm_nn_n, 128x128x8_64x32x1_8x8_8x4_2x4) { using WarpShape = cutlass::gemm::GemmShape<64, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1442,9 +1442,9 @@ TEST(SM50_device_minimum_maximum_ssrgemm_nn_n, 32x32x8_8x16x1_2x2_4x8_4x2) { using WarpShape = cutlass::gemm::GemmShape<8, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + 
cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1478,9 +1478,9 @@ TEST(SM50_device_minimum_maximum_ssrgemm_nn_n, 64x32x8_16x16x1_4x2_4x8_4x2) { using WarpShape = cutlass::gemm::GemmShape<16, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1514,9 +1514,9 @@ TEST(SM50_device_minimum_maximum_ssrgemm_nn_n, 64x64x8_16x32x1_4x4_4x8_4x2) { using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1550,9 +1550,9 @@ TEST(SM50_device_minimum_maximum_ssrgemm_nn_n, 128x32x8_32x16x1_4x4_8x4_4x2) { using WarpShape = cutlass::gemm::GemmShape<32, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using 
AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1586,9 +1586,9 @@ TEST(SM50_device_minimum_maximum_ssrgemm_nn_n, 128x64x8_32x32x1_8x4_4x8_4x2) { using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1622,9 +1622,9 @@ TEST(SM50_device_minimum_maximum_ssrgemm_nn_n, 128x128x8_32x64x1_8x8_4x8_4x2) { using WarpShape = cutlass::gemm::GemmShape<32, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1658,9 +1658,9 @@ TEST(SM50_device_minimum_maximum_ssrgemm_nn_n, 256x32x8_64x16x1_8x4_8x4_4x2) { using WarpShape = cutlass::gemm::GemmShape<64, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = 
Config::MultiplicationOp; @@ -1694,9 +1694,9 @@ TEST(SM50_device_minimum_maximum_ssrgemm_nn_n, 256x64x8_64x32x1_8x8_8x4_4x2) { using WarpShape = cutlass::gemm::GemmShape<64, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1730,9 +1730,9 @@ TEST(SM50_device_minimum_maximum_ssrgemm_nn_n, 32x64x16_8x16x1_2x2_4x8_4x4) { using WarpShape = cutlass::gemm::GemmShape<8, 16, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1766,9 +1766,9 @@ TEST(SM50_device_minimum_maximum_ssrgemm_nn_n, 32x128x16_8x32x1_2x4_4x8_4x4) { using WarpShape = cutlass::gemm::GemmShape<8, 32, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1802,9 +1802,9 @@ 
TEST(SM50_device_minimum_maximum_ssrgemm_nn_n, 64x32x16_16x8x1_2x2_8x4_4x4) { using WarpShape = cutlass::gemm::GemmShape<16, 8, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1838,9 +1838,9 @@ TEST(SM50_device_minimum_maximum_ssrgemm_nn_n, 64x64x8_16x16x1_4x2_4x8_4x4) { using WarpShape = cutlass::gemm::GemmShape<16, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1874,9 +1874,9 @@ TEST(SM50_device_minimum_maximum_ssrgemm_nn_n, 64x128x8_16x32x1_4x4_4x8_4x4) { using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1910,9 +1910,9 @@ TEST(SM50_device_minimum_maximum_ssrgemm_nn_n, 
64x256x8_16x64x1_4x8_4x8_4x4) { using WarpShape = cutlass::gemm::GemmShape<16, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1946,9 +1946,9 @@ TEST(SM50_device_minimum_maximum_ssrgemm_nn_n, 128x32x16_32x8x1_4x2_8x4_4x4) { using WarpShape = cutlass::gemm::GemmShape<32, 8, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1982,9 +1982,9 @@ TEST(SM50_device_minimum_maximum_ssrgemm_nn_n, 128x64x8_32x16x1_4x4_8x4_4x4) { using WarpShape = cutlass::gemm::GemmShape<32, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -2018,9 +2018,9 @@ TEST(SM50_device_minimum_maximum_ssrgemm_nn_n, 128x128x8_32x32x1_8x4_4x8_4x4) { using WarpShape = 
cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -2054,9 +2054,9 @@ TEST(SM50_device_minimum_maximum_ssrgemm_nn_n, 256x64x8_64x16x1_8x4_8x4_4x4) { using WarpShape = cutlass::gemm::GemmShape<64, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; diff --git a/test/device/sm50_simt_minimum_maximum_ssrgemm_nn_t.cu b/test/device/sm50_simt_minimum_maximum_ssrgemm_nn_t.cu index edf13bc..3ebcb0c 100644 --- a/test/device/sm50_simt_minimum_maximum_ssrgemm_nn_t.cu +++ b/test/device/sm50_simt_minimum_maximum_ssrgemm_nn_t.cu @@ -38,9 +38,9 @@ TEST(SM50_device_minimum_maximum_ssrgemm_nn_t, 8x32x8_8x32x1_2x4_4x8_1x1) { using WarpShape = cutlass::gemm::GemmShape<8, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, 
OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -74,9 +74,9 @@ TEST(SM50_device_minimum_maximum_ssrgemm_nn_t, 16x32x8_16x32x1_4x4_4x8_1x1) { using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -110,9 +110,9 @@ TEST(SM50_device_minimum_maximum_ssrgemm_nn_t, 16x64x8_16x64x1_4x8_4x8_1x1) { using WarpShape = cutlass::gemm::GemmShape<16, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -146,9 +146,9 @@ TEST(SM50_device_minimum_maximum_ssrgemm_nn_t, 32x32x8_32x32x1_8x4_4x8_1x1) { using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = 
Config::MultiplicationOp; @@ -182,9 +182,9 @@ TEST(SM50_device_minimum_maximum_ssrgemm_nn_t, 32x64x8_32x64x1_8x8_4x8_1x1) { using WarpShape = cutlass::gemm::GemmShape<32, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -218,9 +218,9 @@ TEST(SM50_device_minimum_maximum_ssrgemm_nn_t, 64x32x8_64x32x1_8x8_8x4_1x1) { using WarpShape = cutlass::gemm::GemmShape<64, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -254,9 +254,9 @@ TEST(SM50_device_minimum_maximum_ssrgemm_nn_t, 8x32x8_8x16x1_2x2_4x8_1x2) { using WarpShape = cutlass::gemm::GemmShape<8, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -290,9 +290,9 @@ 
TEST(SM50_device_minimum_maximum_ssrgemm_nn_t, 8x64x8_8x32x1_2x4_4x8_1x2) { using WarpShape = cutlass::gemm::GemmShape<8, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -326,9 +326,9 @@ TEST(SM50_device_minimum_maximum_ssrgemm_nn_t, 16x32x8_16x16x1_4x2_4x8_1x2) { using WarpShape = cutlass::gemm::GemmShape<16, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -362,9 +362,9 @@ TEST(SM50_device_minimum_maximum_ssrgemm_nn_t, 16x64x8_16x32x1_4x4_4x8_1x2) { using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -398,9 +398,9 @@ TEST(SM50_device_minimum_maximum_ssrgemm_nn_t, 
16x128x8_16x64x1_4x8_4x8_1x2) { using WarpShape = cutlass::gemm::GemmShape<16, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -434,9 +434,9 @@ TEST(SM50_device_minimum_maximum_ssrgemm_nn_t, 32x32x8_32x16x1_4x4_8x4_1x2) { using WarpShape = cutlass::gemm::GemmShape<32, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -470,9 +470,9 @@ TEST(SM50_device_minimum_maximum_ssrgemm_nn_t, 32x64x8_32x32x1_8x4_4x8_1x2) { using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -506,9 +506,9 @@ TEST(SM50_device_minimum_maximum_ssrgemm_nn_t, 32x128x8_32x64x1_8x8_4x8_1x2) { using WarpShape = 
cutlass::gemm::GemmShape<32, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -542,9 +542,9 @@ TEST(SM50_device_minimum_maximum_ssrgemm_nn_t, 64x64x8_64x32x1_8x8_8x4_1x2) { using WarpShape = cutlass::gemm::GemmShape<64, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -578,9 +578,9 @@ TEST(SM50_device_minimum_maximum_ssrgemm_nn_t, 32x32x8_16x32x1_4x4_4x8_2x1) { using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -614,9 +614,9 @@ TEST(SM50_device_minimum_maximum_ssrgemm_nn_t, 64x32x8_32x32x1_8x4_4x8_2x1) { using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = 
cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -650,9 +650,9 @@ TEST(SM50_device_minimum_maximum_ssrgemm_nn_t, 64x64x8_32x64x1_8x8_4x8_2x1) { using WarpShape = cutlass::gemm::GemmShape<32, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -686,9 +686,9 @@ TEST(SM50_device_minimum_maximum_ssrgemm_nn_t, 128x32x8_64x32x1_8x8_8x4_2x1) { using WarpShape = cutlass::gemm::GemmShape<64, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -722,9 +722,9 @@ TEST(SM50_device_minimum_maximum_ssrgemm_nn_t, 16x32x8_8x16x1_2x2_4x8_2x2) { using WarpShape = cutlass::gemm::GemmShape<8, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename 
cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -758,9 +758,9 @@ TEST(SM50_device_minimum_maximum_ssrgemm_nn_t, 16x64x8_8x32x1_2x4_4x8_2x2) { using WarpShape = cutlass::gemm::GemmShape<8, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -794,9 +794,9 @@ TEST(SM50_device_minimum_maximum_ssrgemm_nn_t, 32x32x8_16x16x1_4x2_4x8_2x2) { using WarpShape = cutlass::gemm::GemmShape<16, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -830,9 +830,9 @@ TEST(SM50_device_minimum_maximum_ssrgemm_nn_t, 32x64x8_16x32x1_4x4_4x8_2x2) { using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, 
precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -866,9 +866,9 @@ TEST(SM50_device_minimum_maximum_ssrgemm_nn_t, 32x128x8_16x64x1_4x8_4x8_2x2) { using WarpShape = cutlass::gemm::GemmShape<16, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -902,9 +902,9 @@ TEST(SM50_device_minimum_maximum_ssrgemm_nn_t, 64x32x8_32x16x1_4x4_8x4_2x2) { using WarpShape = cutlass::gemm::GemmShape<32, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -938,9 +938,9 @@ TEST(SM50_device_minimum_maximum_ssrgemm_nn_t, 64x64x8_32x32x1_8x4_4x8_2x2) { using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, 
cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -974,9 +974,9 @@ TEST(SM50_device_minimum_maximum_ssrgemm_nn_t, 64x128x8_32x64x1_8x8_4x8_2x2) { using WarpShape = cutlass::gemm::GemmShape<32, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1010,9 +1010,9 @@ TEST(SM50_device_minimum_maximum_ssrgemm_nn_t, 128x32x8_64x16x1_8x4_8x4_2x2) { using WarpShape = cutlass::gemm::GemmShape<64, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1046,9 +1046,9 @@ TEST(SM50_device_minimum_maximum_ssrgemm_nn_t, 128x64x8_64x32x1_8x8_8x4_2x2) { using WarpShape = cutlass::gemm::GemmShape<64, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename 
cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1082,9 +1082,9 @@ TEST(SM50_device_minimum_maximum_ssrgemm_nn_t, 16x64x16_8x16x1_2x2_4x8_2x4) { using WarpShape = cutlass::gemm::GemmShape<8, 16, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1118,9 +1118,9 @@ TEST(SM50_device_minimum_maximum_ssrgemm_nn_t, 16x128x16_8x32x1_2x4_4x8_2x4) { using WarpShape = cutlass::gemm::GemmShape<8, 32, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1154,9 +1154,9 @@ TEST(SM50_device_minimum_maximum_ssrgemm_nn_t, 32x32x8_16x8x1_2x2_8x4_2x4) { using WarpShape = cutlass::gemm::GemmShape<16, 8, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + 
precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1190,9 +1190,9 @@ TEST(SM50_device_minimum_maximum_ssrgemm_nn_t, 32x64x8_16x16x1_4x2_4x8_2x4) { using WarpShape = cutlass::gemm::GemmShape<16, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1226,9 +1226,9 @@ TEST(SM50_device_minimum_maximum_ssrgemm_nn_t, 32x128x8_16x32x1_4x4_4x8_2x4) { using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1262,9 +1262,9 @@ TEST(SM50_device_minimum_maximum_ssrgemm_nn_t, 32x256x8_16x64x1_4x8_4x8_2x4) { using WarpShape = cutlass::gemm::GemmShape<16, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + 
cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1298,9 +1298,9 @@ TEST(SM50_device_minimum_maximum_ssrgemm_nn_t, 64x64x8_32x16x1_4x4_8x4_2x4) { using WarpShape = cutlass::gemm::GemmShape<32, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1334,9 +1334,9 @@ TEST(SM50_device_minimum_maximum_ssrgemm_nn_t, 64x128x8_32x32x1_8x4_4x8_2x4) { using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1370,9 +1370,9 @@ TEST(SM50_device_minimum_maximum_ssrgemm_nn_t, 64x256x8_32x64x1_8x8_4x8_2x4) { using WarpShape = cutlass::gemm::GemmShape<32, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using 
AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1406,9 +1406,9 @@ TEST(SM50_device_minimum_maximum_ssrgemm_nn_t, 128x128x8_64x32x1_8x8_8x4_2x4) { using WarpShape = cutlass::gemm::GemmShape<64, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1442,9 +1442,9 @@ TEST(SM50_device_minimum_maximum_ssrgemm_nn_t, 32x32x8_8x16x1_2x2_4x8_4x2) { using WarpShape = cutlass::gemm::GemmShape<8, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1478,9 +1478,9 @@ TEST(SM50_device_minimum_maximum_ssrgemm_nn_t, 64x32x8_16x16x1_4x2_4x8_4x2) { using WarpShape = cutlass::gemm::GemmShape<16, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = 
Config::MultiplicationOp; @@ -1514,9 +1514,9 @@ TEST(SM50_device_minimum_maximum_ssrgemm_nn_t, 64x64x8_16x32x1_4x4_4x8_4x2) { using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1550,9 +1550,9 @@ TEST(SM50_device_minimum_maximum_ssrgemm_nn_t, 128x32x8_32x16x1_4x4_8x4_4x2) { using WarpShape = cutlass::gemm::GemmShape<32, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1586,9 +1586,9 @@ TEST(SM50_device_minimum_maximum_ssrgemm_nn_t, 128x64x8_32x32x1_8x4_4x8_4x2) { using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1622,9 +1622,9 @@ 
TEST(SM50_device_minimum_maximum_ssrgemm_nn_t, 128x128x8_32x64x1_8x8_4x8_4x2) { using WarpShape = cutlass::gemm::GemmShape<32, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1658,9 +1658,9 @@ TEST(SM50_device_minimum_maximum_ssrgemm_nn_t, 256x32x8_64x16x1_8x4_8x4_4x2) { using WarpShape = cutlass::gemm::GemmShape<64, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1694,9 +1694,9 @@ TEST(SM50_device_minimum_maximum_ssrgemm_nn_t, 256x64x8_64x32x1_8x8_8x4_4x2) { using WarpShape = cutlass::gemm::GemmShape<64, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1730,9 +1730,9 @@ TEST(SM50_device_minimum_maximum_ssrgemm_nn_t, 
32x64x16_8x16x1_2x2_4x8_4x4) { using WarpShape = cutlass::gemm::GemmShape<8, 16, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1766,9 +1766,9 @@ TEST(SM50_device_minimum_maximum_ssrgemm_nn_t, 32x128x16_8x32x1_2x4_4x8_4x4) { using WarpShape = cutlass::gemm::GemmShape<8, 32, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1802,9 +1802,9 @@ TEST(SM50_device_minimum_maximum_ssrgemm_nn_t, 64x32x16_16x8x1_2x2_8x4_4x4) { using WarpShape = cutlass::gemm::GemmShape<16, 8, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1838,9 +1838,9 @@ TEST(SM50_device_minimum_maximum_ssrgemm_nn_t, 64x64x8_16x16x1_4x2_4x8_4x4) { using WarpShape = 
cutlass::gemm::GemmShape<16, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1874,9 +1874,9 @@ TEST(SM50_device_minimum_maximum_ssrgemm_nn_t, 64x128x8_16x32x1_4x4_4x8_4x4) { using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1910,9 +1910,9 @@ TEST(SM50_device_minimum_maximum_ssrgemm_nn_t, 64x256x8_16x64x1_4x8_4x8_4x4) { using WarpShape = cutlass::gemm::GemmShape<16, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1946,9 +1946,9 @@ TEST(SM50_device_minimum_maximum_ssrgemm_nn_t, 128x32x16_32x8x1_4x2_8x4_4x4) { using WarpShape = cutlass::gemm::GemmShape<32, 8, 16>; using 
InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1982,9 +1982,9 @@ TEST(SM50_device_minimum_maximum_ssrgemm_nn_t, 128x64x8_32x16x1_4x4_8x4_4x4) { using WarpShape = cutlass::gemm::GemmShape<32, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -2018,9 +2018,9 @@ TEST(SM50_device_minimum_maximum_ssrgemm_nn_t, 128x128x8_32x32x1_8x4_4x8_4x4) { using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -2054,9 +2054,9 @@ TEST(SM50_device_minimum_maximum_ssrgemm_nn_t, 256x64x8_64x16x1_8x4_8x4_4x4) { using WarpShape = cutlass::gemm::GemmShape<64, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - 
using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; diff --git a/test/device/sm50_simt_minimum_maximum_ssrgemm_nt_n.cu b/test/device/sm50_simt_minimum_maximum_ssrgemm_nt_n.cu index 8f2a3a7..d92f374 100644 --- a/test/device/sm50_simt_minimum_maximum_ssrgemm_nt_n.cu +++ b/test/device/sm50_simt_minimum_maximum_ssrgemm_nt_n.cu @@ -38,9 +38,9 @@ TEST(SM50_device_minimum_maximum_ssrgemm_nt_n, 8x32x8_8x32x1_2x4_4x8_1x1) { using WarpShape = cutlass::gemm::GemmShape<8, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -74,9 +74,9 @@ TEST(SM50_device_minimum_maximum_ssrgemm_nt_n, 16x32x8_16x32x1_4x4_4x8_1x1) { using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -110,9 +110,9 
@@ TEST(SM50_device_minimum_maximum_ssrgemm_nt_n, 16x64x8_16x64x1_4x8_4x8_1x1) { using WarpShape = cutlass::gemm::GemmShape<16, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -146,9 +146,9 @@ TEST(SM50_device_minimum_maximum_ssrgemm_nt_n, 32x32x8_32x32x1_8x4_4x8_1x1) { using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -182,9 +182,9 @@ TEST(SM50_device_minimum_maximum_ssrgemm_nt_n, 32x64x8_32x64x1_8x8_4x8_1x1) { using WarpShape = cutlass::gemm::GemmShape<32, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -218,9 +218,9 @@ TEST(SM50_device_minimum_maximum_ssrgemm_nt_n, 
64x32x8_64x32x1_8x8_8x4_1x1) { using WarpShape = cutlass::gemm::GemmShape<64, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -254,9 +254,9 @@ TEST(SM50_device_minimum_maximum_ssrgemm_nt_n, 8x32x8_8x16x1_2x2_4x8_1x2) { using WarpShape = cutlass::gemm::GemmShape<8, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -290,9 +290,9 @@ TEST(SM50_device_minimum_maximum_ssrgemm_nt_n, 8x64x8_8x32x1_2x4_4x8_1x2) { using WarpShape = cutlass::gemm::GemmShape<8, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -326,9 +326,9 @@ TEST(SM50_device_minimum_maximum_ssrgemm_nt_n, 16x32x8_16x16x1_4x2_4x8_1x2) { using WarpShape = 
cutlass::gemm::GemmShape<16, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -362,9 +362,9 @@ TEST(SM50_device_minimum_maximum_ssrgemm_nt_n, 16x64x8_16x32x1_4x4_4x8_1x2) { using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -398,9 +398,9 @@ TEST(SM50_device_minimum_maximum_ssrgemm_nt_n, 16x128x8_16x64x1_4x8_4x8_1x2) { using WarpShape = cutlass::gemm::GemmShape<16, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -434,9 +434,9 @@ TEST(SM50_device_minimum_maximum_ssrgemm_nt_n, 32x32x8_32x16x1_4x4_8x4_1x2) { using WarpShape = cutlass::gemm::GemmShape<32, 16, 8>; using InstructionShape = 
cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -470,9 +470,9 @@ TEST(SM50_device_minimum_maximum_ssrgemm_nt_n, 32x64x8_32x32x1_8x4_4x8_1x2) { using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -506,9 +506,9 @@ TEST(SM50_device_minimum_maximum_ssrgemm_nt_n, 32x128x8_32x64x1_8x8_4x8_1x2) { using WarpShape = cutlass::gemm::GemmShape<32, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -542,9 +542,9 @@ TEST(SM50_device_minimum_maximum_ssrgemm_nt_n, 64x64x8_64x32x1_8x8_8x4_1x2) { using WarpShape = cutlass::gemm::GemmShape<64, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename 
cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -578,9 +578,9 @@ TEST(SM50_device_minimum_maximum_ssrgemm_nt_n, 32x32x8_16x32x1_4x4_4x8_2x1) { using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -614,9 +614,9 @@ TEST(SM50_device_minimum_maximum_ssrgemm_nt_n, 64x32x8_32x32x1_8x4_4x8_2x1) { using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -650,9 +650,9 @@ TEST(SM50_device_minimum_maximum_ssrgemm_nt_n, 64x64x8_32x64x1_8x8_4x8_2x1) { using WarpShape = cutlass::gemm::GemmShape<32, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, 
precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -686,9 +686,9 @@ TEST(SM50_device_minimum_maximum_ssrgemm_nt_n, 128x32x8_64x32x1_8x8_8x4_2x1) { using WarpShape = cutlass::gemm::GemmShape<64, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -722,9 +722,9 @@ TEST(SM50_device_minimum_maximum_ssrgemm_nt_n, 16x32x8_8x16x1_2x2_4x8_2x2) { using WarpShape = cutlass::gemm::GemmShape<8, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -758,9 +758,9 @@ TEST(SM50_device_minimum_maximum_ssrgemm_nt_n, 16x64x8_8x32x1_2x4_4x8_2x2) { using WarpShape = cutlass::gemm::GemmShape<8, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, 
cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -794,9 +794,9 @@ TEST(SM50_device_minimum_maximum_ssrgemm_nt_n, 32x32x8_16x16x1_4x2_4x8_2x2) { using WarpShape = cutlass::gemm::GemmShape<16, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -830,9 +830,9 @@ TEST(SM50_device_minimum_maximum_ssrgemm_nt_n, 32x64x8_16x32x1_4x4_4x8_2x2) { using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -866,9 +866,9 @@ TEST(SM50_device_minimum_maximum_ssrgemm_nt_n, 32x128x8_16x64x1_4x8_4x8_2x2) { using WarpShape = cutlass::gemm::GemmShape<16, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename 
cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -902,9 +902,9 @@ TEST(SM50_device_minimum_maximum_ssrgemm_nt_n, 64x32x8_32x16x1_4x4_8x4_2x2) { using WarpShape = cutlass::gemm::GemmShape<32, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -938,9 +938,9 @@ TEST(SM50_device_minimum_maximum_ssrgemm_nt_n, 64x64x8_32x32x1_8x4_4x8_2x2) { using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -974,9 +974,9 @@ TEST(SM50_device_minimum_maximum_ssrgemm_nt_n, 64x128x8_32x64x1_8x8_4x8_2x2) { using WarpShape = cutlass::gemm::GemmShape<32, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, 
precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1010,9 +1010,9 @@ TEST(SM50_device_minimum_maximum_ssrgemm_nt_n, 128x32x8_64x16x1_8x4_8x4_2x2) { using WarpShape = cutlass::gemm::GemmShape<64, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1046,9 +1046,9 @@ TEST(SM50_device_minimum_maximum_ssrgemm_nt_n, 128x64x8_64x32x1_8x8_8x4_2x2) { using WarpShape = cutlass::gemm::GemmShape<64, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1082,9 +1082,9 @@ TEST(SM50_device_minimum_maximum_ssrgemm_nt_n, 16x64x16_8x16x1_2x2_4x8_2x4) { using WarpShape = cutlass::gemm::GemmShape<8, 16, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, 
cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1118,9 +1118,9 @@ TEST(SM50_device_minimum_maximum_ssrgemm_nt_n, 16x128x16_8x32x1_2x4_4x8_2x4) { using WarpShape = cutlass::gemm::GemmShape<8, 32, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1154,9 +1154,9 @@ TEST(SM50_device_minimum_maximum_ssrgemm_nt_n, 32x32x8_16x8x1_2x2_8x4_2x4) { using WarpShape = cutlass::gemm::GemmShape<16, 8, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1190,9 +1190,9 @@ TEST(SM50_device_minimum_maximum_ssrgemm_nt_n, 32x64x8_16x16x1_4x2_4x8_2x4) { using WarpShape = cutlass::gemm::GemmShape<16, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = 
Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1226,9 +1226,9 @@ TEST(SM50_device_minimum_maximum_ssrgemm_nt_n, 32x128x8_16x32x1_4x4_4x8_2x4) { using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1262,9 +1262,9 @@ TEST(SM50_device_minimum_maximum_ssrgemm_nt_n, 32x256x8_16x64x1_4x8_4x8_2x4) { using WarpShape = cutlass::gemm::GemmShape<16, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1298,9 +1298,9 @@ TEST(SM50_device_minimum_maximum_ssrgemm_nt_n, 64x64x8_32x16x1_4x4_8x4_2x4) { using WarpShape = cutlass::gemm::GemmShape<32, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = 
Config::MultiplicationOp; @@ -1334,9 +1334,9 @@ TEST(SM50_device_minimum_maximum_ssrgemm_nt_n, 64x128x8_32x32x1_8x4_4x8_2x4) { using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1370,9 +1370,9 @@ TEST(SM50_device_minimum_maximum_ssrgemm_nt_n, 64x256x8_32x64x1_8x8_4x8_2x4) { using WarpShape = cutlass::gemm::GemmShape<32, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1406,9 +1406,9 @@ TEST(SM50_device_minimum_maximum_ssrgemm_nt_n, 128x128x8_64x32x1_8x8_8x4_2x4) { using WarpShape = cutlass::gemm::GemmShape<64, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1442,9 +1442,9 @@ 
TEST(SM50_device_minimum_maximum_ssrgemm_nt_n, 32x32x8_8x16x1_2x2_4x8_4x2) { using WarpShape = cutlass::gemm::GemmShape<8, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1478,9 +1478,9 @@ TEST(SM50_device_minimum_maximum_ssrgemm_nt_n, 64x32x8_16x16x1_4x2_4x8_4x2) { using WarpShape = cutlass::gemm::GemmShape<16, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1514,9 +1514,9 @@ TEST(SM50_device_minimum_maximum_ssrgemm_nt_n, 64x64x8_16x32x1_4x4_4x8_4x2) { using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1550,9 +1550,9 @@ TEST(SM50_device_minimum_maximum_ssrgemm_nt_n, 
128x32x8_32x16x1_4x4_8x4_4x2) { using WarpShape = cutlass::gemm::GemmShape<32, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1586,9 +1586,9 @@ TEST(SM50_device_minimum_maximum_ssrgemm_nt_n, 128x64x8_32x32x1_8x4_4x8_4x2) { using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1622,9 +1622,9 @@ TEST(SM50_device_minimum_maximum_ssrgemm_nt_n, 128x128x8_32x64x1_8x8_4x8_4x2) { using WarpShape = cutlass::gemm::GemmShape<32, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1658,9 +1658,9 @@ TEST(SM50_device_minimum_maximum_ssrgemm_nt_n, 256x32x8_64x16x1_8x4_8x4_4x2) { using WarpShape = 
cutlass::gemm::GemmShape<64, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1694,9 +1694,9 @@ TEST(SM50_device_minimum_maximum_ssrgemm_nt_n, 256x64x8_64x32x1_8x8_8x4_4x2) { using WarpShape = cutlass::gemm::GemmShape<64, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1730,9 +1730,9 @@ TEST(SM50_device_minimum_maximum_ssrgemm_nt_n, 32x64x16_8x16x1_2x2_4x8_4x4) { using WarpShape = cutlass::gemm::GemmShape<8, 16, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1766,9 +1766,9 @@ TEST(SM50_device_minimum_maximum_ssrgemm_nt_n, 32x128x16_8x32x1_2x4_4x8_4x4) { using WarpShape = cutlass::gemm::GemmShape<8, 32, 16>; using InstructionShape 
= cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1802,9 +1802,9 @@ TEST(SM50_device_minimum_maximum_ssrgemm_nt_n, 64x32x16_16x8x1_2x2_8x4_4x4) { using WarpShape = cutlass::gemm::GemmShape<16, 8, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1838,9 +1838,9 @@ TEST(SM50_device_minimum_maximum_ssrgemm_nt_n, 64x64x8_16x16x1_4x2_4x8_4x4) { using WarpShape = cutlass::gemm::GemmShape<16, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1874,9 +1874,9 @@ TEST(SM50_device_minimum_maximum_ssrgemm_nt_n, 64x128x8_16x32x1_4x4_4x8_4x4) { using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = 
typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1910,9 +1910,9 @@ TEST(SM50_device_minimum_maximum_ssrgemm_nt_n, 64x256x8_16x64x1_4x8_4x8_4x4) { using WarpShape = cutlass::gemm::GemmShape<16, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1946,9 +1946,9 @@ TEST(SM50_device_minimum_maximum_ssrgemm_nt_n, 128x32x16_32x8x1_4x2_8x4_4x4) { using WarpShape = cutlass::gemm::GemmShape<32, 8, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1982,9 +1982,9 @@ TEST(SM50_device_minimum_maximum_ssrgemm_nt_n, 128x64x8_32x16x1_4x4_8x4_4x4) { using WarpShape = cutlass::gemm::GemmShape<32, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename 
cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -2018,9 +2018,9 @@ TEST(SM50_device_minimum_maximum_ssrgemm_nt_n, 128x128x8_32x32x1_8x4_4x8_4x4) { using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -2054,9 +2054,9 @@ TEST(SM50_device_minimum_maximum_ssrgemm_nt_n, 256x64x8_64x16x1_8x4_8x4_4x4) { using WarpShape = cutlass::gemm::GemmShape<64, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; diff --git a/test/device/sm50_simt_minimum_maximum_ssrgemm_nt_t.cu b/test/device/sm50_simt_minimum_maximum_ssrgemm_nt_t.cu index f898ac7..bc383f7 100644 --- a/test/device/sm50_simt_minimum_maximum_ssrgemm_nt_t.cu +++ b/test/device/sm50_simt_minimum_maximum_ssrgemm_nt_t.cu @@ -38,9 +38,9 @@ 
TEST(SM50_device_minimum_maximum_ssrgemm_nt_t, 8x32x8_8x32x1_2x4_4x8_1x1) { using WarpShape = cutlass::gemm::GemmShape<8, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -74,9 +74,9 @@ TEST(SM50_device_minimum_maximum_ssrgemm_nt_t, 16x32x8_16x32x1_4x4_4x8_1x1) { using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -110,9 +110,9 @@ TEST(SM50_device_minimum_maximum_ssrgemm_nt_t, 16x64x8_16x64x1_4x8_4x8_1x1) { using WarpShape = cutlass::gemm::GemmShape<16, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -146,9 +146,9 @@ TEST(SM50_device_minimum_maximum_ssrgemm_nt_t, 
32x32x8_32x32x1_8x4_4x8_1x1) { using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -182,9 +182,9 @@ TEST(SM50_device_minimum_maximum_ssrgemm_nt_t, 32x64x8_32x64x1_8x8_4x8_1x1) { using WarpShape = cutlass::gemm::GemmShape<32, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -218,9 +218,9 @@ TEST(SM50_device_minimum_maximum_ssrgemm_nt_t, 64x32x8_64x32x1_8x8_8x4_1x1) { using WarpShape = cutlass::gemm::GemmShape<64, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -254,9 +254,9 @@ TEST(SM50_device_minimum_maximum_ssrgemm_nt_t, 8x32x8_8x16x1_2x2_4x8_1x2) { using WarpShape = 
cutlass::gemm::GemmShape<8, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -290,9 +290,9 @@ TEST(SM50_device_minimum_maximum_ssrgemm_nt_t, 8x64x8_8x32x1_2x4_4x8_1x2) { using WarpShape = cutlass::gemm::GemmShape<8, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -326,9 +326,9 @@ TEST(SM50_device_minimum_maximum_ssrgemm_nt_t, 16x32x8_16x16x1_4x2_4x8_1x2) { using WarpShape = cutlass::gemm::GemmShape<16, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -362,9 +362,9 @@ TEST(SM50_device_minimum_maximum_ssrgemm_nt_t, 16x64x8_16x32x1_4x4_4x8_1x2) { using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = 
cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -398,9 +398,9 @@ TEST(SM50_device_minimum_maximum_ssrgemm_nt_t, 16x128x8_16x64x1_4x8_4x8_1x2) { using WarpShape = cutlass::gemm::GemmShape<16, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -434,9 +434,9 @@ TEST(SM50_device_minimum_maximum_ssrgemm_nt_t, 32x32x8_32x16x1_4x4_8x4_1x2) { using WarpShape = cutlass::gemm::GemmShape<32, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -470,9 +470,9 @@ TEST(SM50_device_minimum_maximum_ssrgemm_nt_t, 32x64x8_32x32x1_8x4_4x8_1x2) { using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename 
cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -506,9 +506,9 @@ TEST(SM50_device_minimum_maximum_ssrgemm_nt_t, 32x128x8_32x64x1_8x8_4x8_1x2) { using WarpShape = cutlass::gemm::GemmShape<32, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -542,9 +542,9 @@ TEST(SM50_device_minimum_maximum_ssrgemm_nt_t, 64x64x8_64x32x1_8x8_8x4_1x2) { using WarpShape = cutlass::gemm::GemmShape<64, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -578,9 +578,9 @@ TEST(SM50_device_minimum_maximum_ssrgemm_nt_t, 32x32x8_16x32x1_4x4_4x8_2x1) { using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, 
precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -614,9 +614,9 @@ TEST(SM50_device_minimum_maximum_ssrgemm_nt_t, 64x32x8_32x32x1_8x4_4x8_2x1) { using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -650,9 +650,9 @@ TEST(SM50_device_minimum_maximum_ssrgemm_nt_t, 64x64x8_32x64x1_8x8_4x8_2x1) { using WarpShape = cutlass::gemm::GemmShape<32, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -686,9 +686,9 @@ TEST(SM50_device_minimum_maximum_ssrgemm_nt_t, 128x32x8_64x32x1_8x8_8x4_2x1) { using WarpShape = cutlass::gemm::GemmShape<64, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, 
cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -722,9 +722,9 @@ TEST(SM50_device_minimum_maximum_ssrgemm_nt_t, 16x32x8_8x16x1_2x2_4x8_2x2) { using WarpShape = cutlass::gemm::GemmShape<8, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -758,9 +758,9 @@ TEST(SM50_device_minimum_maximum_ssrgemm_nt_t, 16x64x8_8x32x1_2x4_4x8_2x2) { using WarpShape = cutlass::gemm::GemmShape<8, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -794,9 +794,9 @@ TEST(SM50_device_minimum_maximum_ssrgemm_nt_t, 32x32x8_16x16x1_4x2_4x8_2x2) { using WarpShape = cutlass::gemm::GemmShape<16, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename 
cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -830,9 +830,9 @@ TEST(SM50_device_minimum_maximum_ssrgemm_nt_t, 32x64x8_16x32x1_4x4_4x8_2x2) { using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -866,9 +866,9 @@ TEST(SM50_device_minimum_maximum_ssrgemm_nt_t, 32x128x8_16x64x1_4x8_4x8_2x2) { using WarpShape = cutlass::gemm::GemmShape<16, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -902,9 +902,9 @@ TEST(SM50_device_minimum_maximum_ssrgemm_nt_t, 64x32x8_32x16x1_4x4_8x4_2x2) { using WarpShape = cutlass::gemm::GemmShape<32, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, 
precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -938,9 +938,9 @@ TEST(SM50_device_minimum_maximum_ssrgemm_nt_t, 64x64x8_32x32x1_8x4_4x8_2x2) { using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -974,9 +974,9 @@ TEST(SM50_device_minimum_maximum_ssrgemm_nt_t, 64x128x8_32x64x1_8x8_4x8_2x2) { using WarpShape = cutlass::gemm::GemmShape<32, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1010,9 +1010,9 @@ TEST(SM50_device_minimum_maximum_ssrgemm_nt_t, 128x32x8_64x16x1_8x4_8x4_2x2) { using WarpShape = cutlass::gemm::GemmShape<64, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, 
cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1046,9 +1046,9 @@ TEST(SM50_device_minimum_maximum_ssrgemm_nt_t, 128x64x8_64x32x1_8x8_8x4_2x2) { using WarpShape = cutlass::gemm::GemmShape<64, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1082,9 +1082,9 @@ TEST(SM50_device_minimum_maximum_ssrgemm_nt_t, 16x64x16_8x16x1_2x2_4x8_2x4) { using WarpShape = cutlass::gemm::GemmShape<8, 16, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1118,9 +1118,9 @@ TEST(SM50_device_minimum_maximum_ssrgemm_nt_t, 16x128x16_8x32x1_2x4_4x8_2x4) { using WarpShape = cutlass::gemm::GemmShape<8, 32, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = 
Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1154,9 +1154,9 @@ TEST(SM50_device_minimum_maximum_ssrgemm_nt_t, 32x32x8_16x8x1_2x2_8x4_2x4) { using WarpShape = cutlass::gemm::GemmShape<16, 8, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1190,9 +1190,9 @@ TEST(SM50_device_minimum_maximum_ssrgemm_nt_t, 32x64x8_16x16x1_4x2_4x8_2x4) { using WarpShape = cutlass::gemm::GemmShape<16, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1226,9 +1226,9 @@ TEST(SM50_device_minimum_maximum_ssrgemm_nt_t, 32x128x8_16x32x1_4x4_4x8_2x4) { using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; 
@@ -1262,9 +1262,9 @@ TEST(SM50_device_minimum_maximum_ssrgemm_nt_t, 32x256x8_16x64x1_4x8_4x8_2x4) { using WarpShape = cutlass::gemm::GemmShape<16, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1298,9 +1298,9 @@ TEST(SM50_device_minimum_maximum_ssrgemm_nt_t, 64x64x8_32x16x1_4x4_8x4_2x4) { using WarpShape = cutlass::gemm::GemmShape<32, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1334,9 +1334,9 @@ TEST(SM50_device_minimum_maximum_ssrgemm_nt_t, 64x128x8_32x32x1_8x4_4x8_2x4) { using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1370,9 +1370,9 @@ 
TEST(SM50_device_minimum_maximum_ssrgemm_nt_t, 64x256x8_32x64x1_8x8_4x8_2x4) { using WarpShape = cutlass::gemm::GemmShape<32, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1406,9 +1406,9 @@ TEST(SM50_device_minimum_maximum_ssrgemm_nt_t, 128x128x8_64x32x1_8x8_8x4_2x4) { using WarpShape = cutlass::gemm::GemmShape<64, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1442,9 +1442,9 @@ TEST(SM50_device_minimum_maximum_ssrgemm_nt_t, 32x32x8_8x16x1_2x2_4x8_4x2) { using WarpShape = cutlass::gemm::GemmShape<8, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1478,9 +1478,9 @@ TEST(SM50_device_minimum_maximum_ssrgemm_nt_t, 
64x32x8_16x16x1_4x2_4x8_4x2) { using WarpShape = cutlass::gemm::GemmShape<16, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1514,9 +1514,9 @@ TEST(SM50_device_minimum_maximum_ssrgemm_nt_t, 64x64x8_16x32x1_4x4_4x8_4x2) { using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1550,9 +1550,9 @@ TEST(SM50_device_minimum_maximum_ssrgemm_nt_t, 128x32x8_32x16x1_4x4_8x4_4x2) { using WarpShape = cutlass::gemm::GemmShape<32, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1586,9 +1586,9 @@ TEST(SM50_device_minimum_maximum_ssrgemm_nt_t, 128x64x8_32x32x1_8x4_4x8_4x2) { using WarpShape = 
cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1622,9 +1622,9 @@ TEST(SM50_device_minimum_maximum_ssrgemm_nt_t, 128x128x8_32x64x1_8x8_4x8_4x2) { using WarpShape = cutlass::gemm::GemmShape<32, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1658,9 +1658,9 @@ TEST(SM50_device_minimum_maximum_ssrgemm_nt_t, 256x32x8_64x16x1_8x4_8x4_4x2) { using WarpShape = cutlass::gemm::GemmShape<64, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1694,9 +1694,9 @@ TEST(SM50_device_minimum_maximum_ssrgemm_nt_t, 256x64x8_64x32x1_8x8_8x4_4x2) { using WarpShape = cutlass::gemm::GemmShape<64, 32, 8>; using 
InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1730,9 +1730,9 @@ TEST(SM50_device_minimum_maximum_ssrgemm_nt_t, 32x64x16_8x16x1_2x2_4x8_4x4) { using WarpShape = cutlass::gemm::GemmShape<8, 16, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1766,9 +1766,9 @@ TEST(SM50_device_minimum_maximum_ssrgemm_nt_t, 32x128x16_8x32x1_2x4_4x8_4x4) { using WarpShape = cutlass::gemm::GemmShape<8, 32, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1802,9 +1802,9 @@ TEST(SM50_device_minimum_maximum_ssrgemm_nt_t, 64x32x16_16x8x1_2x2_8x4_4x4) { using WarpShape = cutlass::gemm::GemmShape<16, 8, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - 
using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1838,9 +1838,9 @@ TEST(SM50_device_minimum_maximum_ssrgemm_nt_t, 64x64x8_16x16x1_4x2_4x8_4x4) { using WarpShape = cutlass::gemm::GemmShape<16, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1874,9 +1874,9 @@ TEST(SM50_device_minimum_maximum_ssrgemm_nt_t, 64x128x8_16x32x1_4x4_4x8_4x4) { using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1910,9 +1910,9 @@ TEST(SM50_device_minimum_maximum_ssrgemm_nt_t, 64x256x8_16x64x1_4x8_4x8_4x4) { using WarpShape = cutlass::gemm::GemmShape<16, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename 
cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1946,9 +1946,9 @@ TEST(SM50_device_minimum_maximum_ssrgemm_nt_t, 128x32x16_32x8x1_4x2_8x4_4x4) { using WarpShape = cutlass::gemm::GemmShape<32, 8, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1982,9 +1982,9 @@ TEST(SM50_device_minimum_maximum_ssrgemm_nt_t, 128x64x8_32x16x1_4x4_8x4_4x4) { using WarpShape = cutlass::gemm::GemmShape<32, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -2018,9 +2018,9 @@ TEST(SM50_device_minimum_maximum_ssrgemm_nt_t, 128x128x8_32x32x1_8x4_4x8_4x4) { using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - 
precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -2054,9 +2054,9 @@ TEST(SM50_device_minimum_maximum_ssrgemm_nt_t, 256x64x8_64x16x1_8x4_8x4_4x4) { using WarpShape = cutlass::gemm::GemmShape<64, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; diff --git a/test/device/sm50_simt_minimum_maximum_ssrgemm_tn_n.cu b/test/device/sm50_simt_minimum_maximum_ssrgemm_tn_n.cu index 6611645..ee965a0 100644 --- a/test/device/sm50_simt_minimum_maximum_ssrgemm_tn_n.cu +++ b/test/device/sm50_simt_minimum_maximum_ssrgemm_tn_n.cu @@ -38,9 +38,9 @@ TEST(SM50_device_minimum_maximum_ssrgemm_tn_n, 8x32x8_8x32x1_2x4_4x8_1x1) { using WarpShape = cutlass::gemm::GemmShape<8, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -74,9 +74,9 @@ TEST(SM50_device_minimum_maximum_ssrgemm_tn_n, 
16x32x8_16x32x1_4x4_4x8_1x1) { using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -110,9 +110,9 @@ TEST(SM50_device_minimum_maximum_ssrgemm_tn_n, 16x64x8_16x64x1_4x8_4x8_1x1) { using WarpShape = cutlass::gemm::GemmShape<16, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -146,9 +146,9 @@ TEST(SM50_device_minimum_maximum_ssrgemm_tn_n, 32x32x8_32x32x1_8x4_4x8_1x1) { using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -182,9 +182,9 @@ TEST(SM50_device_minimum_maximum_ssrgemm_tn_n, 32x64x8_32x64x1_8x8_4x8_1x1) { using WarpShape = 
cutlass::gemm::GemmShape<32, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -218,9 +218,9 @@ TEST(SM50_device_minimum_maximum_ssrgemm_tn_n, 64x32x8_64x32x1_8x8_8x4_1x1) { using WarpShape = cutlass::gemm::GemmShape<64, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -254,9 +254,9 @@ TEST(SM50_device_minimum_maximum_ssrgemm_tn_n, 8x32x8_8x16x1_2x2_4x8_1x2) { using WarpShape = cutlass::gemm::GemmShape<8, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -290,9 +290,9 @@ TEST(SM50_device_minimum_maximum_ssrgemm_tn_n, 8x64x8_8x32x1_2x4_4x8_1x2) { using WarpShape = cutlass::gemm::GemmShape<8, 32, 8>; using InstructionShape = 
cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -326,9 +326,9 @@ TEST(SM50_device_minimum_maximum_ssrgemm_tn_n, 16x32x8_16x16x1_4x2_4x8_1x2) { using WarpShape = cutlass::gemm::GemmShape<16, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -362,9 +362,9 @@ TEST(SM50_device_minimum_maximum_ssrgemm_tn_n, 16x64x8_16x32x1_4x4_4x8_1x2) { using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -398,9 +398,9 @@ TEST(SM50_device_minimum_maximum_ssrgemm_tn_n, 16x128x8_16x64x1_4x8_4x8_1x2) { using WarpShape = cutlass::gemm::GemmShape<16, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename 
cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -434,9 +434,9 @@ TEST(SM50_device_minimum_maximum_ssrgemm_tn_n, 32x32x8_32x16x1_4x4_8x4_1x2) { using WarpShape = cutlass::gemm::GemmShape<32, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -470,9 +470,9 @@ TEST(SM50_device_minimum_maximum_ssrgemm_tn_n, 32x64x8_32x32x1_8x4_4x8_1x2) { using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -506,9 +506,9 @@ TEST(SM50_device_minimum_maximum_ssrgemm_tn_n, 32x128x8_32x64x1_8x8_4x8_1x2) { using WarpShape = cutlass::gemm::GemmShape<32, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, 
precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -542,9 +542,9 @@ TEST(SM50_device_minimum_maximum_ssrgemm_tn_n, 64x64x8_64x32x1_8x8_8x4_1x2) { using WarpShape = cutlass::gemm::GemmShape<64, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -578,9 +578,9 @@ TEST(SM50_device_minimum_maximum_ssrgemm_tn_n, 32x32x8_16x32x1_4x4_4x8_2x1) { using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -614,9 +614,9 @@ TEST(SM50_device_minimum_maximum_ssrgemm_tn_n, 64x32x8_32x32x1_8x4_4x8_2x1) { using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, 
cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -650,9 +650,9 @@ TEST(SM50_device_minimum_maximum_ssrgemm_tn_n, 64x64x8_32x64x1_8x8_4x8_2x1) { using WarpShape = cutlass::gemm::GemmShape<32, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -686,9 +686,9 @@ TEST(SM50_device_minimum_maximum_ssrgemm_tn_n, 128x32x8_64x32x1_8x8_8x4_2x1) { using WarpShape = cutlass::gemm::GemmShape<64, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -722,9 +722,9 @@ TEST(SM50_device_minimum_maximum_ssrgemm_tn_n, 16x32x8_8x16x1_2x2_4x8_2x2) { using WarpShape = cutlass::gemm::GemmShape<8, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename 
cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -758,9 +758,9 @@ TEST(SM50_device_minimum_maximum_ssrgemm_tn_n, 16x64x8_8x32x1_2x4_4x8_2x2) { using WarpShape = cutlass::gemm::GemmShape<8, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -794,9 +794,9 @@ TEST(SM50_device_minimum_maximum_ssrgemm_tn_n, 32x32x8_16x16x1_4x2_4x8_2x2) { using WarpShape = cutlass::gemm::GemmShape<16, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -830,9 +830,9 @@ TEST(SM50_device_minimum_maximum_ssrgemm_tn_n, 32x64x8_16x32x1_4x4_4x8_2x2) { using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, 
precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -866,9 +866,9 @@ TEST(SM50_device_minimum_maximum_ssrgemm_tn_n, 32x128x8_16x64x1_4x8_4x8_2x2) { using WarpShape = cutlass::gemm::GemmShape<16, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -902,9 +902,9 @@ TEST(SM50_device_minimum_maximum_ssrgemm_tn_n, 64x32x8_32x16x1_4x4_8x4_2x2) { using WarpShape = cutlass::gemm::GemmShape<32, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -938,9 +938,9 @@ TEST(SM50_device_minimum_maximum_ssrgemm_tn_n, 64x64x8_32x32x1_8x4_4x8_2x2) { using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, 
OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -974,9 +974,9 @@ TEST(SM50_device_minimum_maximum_ssrgemm_tn_n, 64x128x8_32x64x1_8x8_4x8_2x2) { using WarpShape = cutlass::gemm::GemmShape<32, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1010,9 +1010,9 @@ TEST(SM50_device_minimum_maximum_ssrgemm_tn_n, 128x32x8_64x16x1_8x4_8x4_2x2) { using WarpShape = cutlass::gemm::GemmShape<64, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1046,9 +1046,9 @@ TEST(SM50_device_minimum_maximum_ssrgemm_tn_n, 128x64x8_64x32x1_8x8_8x4_2x2) { using WarpShape = cutlass::gemm::GemmShape<64, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using 
MultOp = Config::MultiplicationOp; @@ -1082,9 +1082,9 @@ TEST(SM50_device_minimum_maximum_ssrgemm_tn_n, 16x64x16_8x16x1_2x2_4x8_2x4) { using WarpShape = cutlass::gemm::GemmShape<8, 16, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1118,9 +1118,9 @@ TEST(SM50_device_minimum_maximum_ssrgemm_tn_n, 16x128x16_8x32x1_2x4_4x8_2x4) { using WarpShape = cutlass::gemm::GemmShape<8, 32, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1154,9 +1154,9 @@ TEST(SM50_device_minimum_maximum_ssrgemm_tn_n, 32x32x8_16x8x1_2x2_8x4_2x4) { using WarpShape = cutlass::gemm::GemmShape<16, 8, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1190,9 +1190,9 @@ 
TEST(SM50_device_minimum_maximum_ssrgemm_tn_n, 32x64x8_16x16x1_4x2_4x8_2x4) { using WarpShape = cutlass::gemm::GemmShape<16, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1226,9 +1226,9 @@ TEST(SM50_device_minimum_maximum_ssrgemm_tn_n, 32x128x8_16x32x1_4x4_4x8_2x4) { using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1262,9 +1262,9 @@ TEST(SM50_device_minimum_maximum_ssrgemm_tn_n, 32x256x8_16x64x1_4x8_4x8_2x4) { using WarpShape = cutlass::gemm::GemmShape<16, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1298,9 +1298,9 @@ TEST(SM50_device_minimum_maximum_ssrgemm_tn_n, 
64x64x8_32x16x1_4x4_8x4_2x4) { using WarpShape = cutlass::gemm::GemmShape<32, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1334,9 +1334,9 @@ TEST(SM50_device_minimum_maximum_ssrgemm_tn_n, 64x128x8_32x32x1_8x4_4x8_2x4) { using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1370,9 +1370,9 @@ TEST(SM50_device_minimum_maximum_ssrgemm_tn_n, 64x256x8_32x64x1_8x8_4x8_2x4) { using WarpShape = cutlass::gemm::GemmShape<32, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1406,9 +1406,9 @@ TEST(SM50_device_minimum_maximum_ssrgemm_tn_n, 128x128x8_64x32x1_8x8_8x4_2x4) { using WarpShape = 
cutlass::gemm::GemmShape<64, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1442,9 +1442,9 @@ TEST(SM50_device_minimum_maximum_ssrgemm_tn_n, 32x32x8_8x16x1_2x2_4x8_4x2) { using WarpShape = cutlass::gemm::GemmShape<8, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1478,9 +1478,9 @@ TEST(SM50_device_minimum_maximum_ssrgemm_tn_n, 64x32x8_16x16x1_4x2_4x8_4x2) { using WarpShape = cutlass::gemm::GemmShape<16, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1514,9 +1514,9 @@ TEST(SM50_device_minimum_maximum_ssrgemm_tn_n, 64x64x8_16x32x1_4x4_4x8_4x2) { using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = 
cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1550,9 +1550,9 @@ TEST(SM50_device_minimum_maximum_ssrgemm_tn_n, 128x32x8_32x16x1_4x4_8x4_4x2) { using WarpShape = cutlass::gemm::GemmShape<32, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1586,9 +1586,9 @@ TEST(SM50_device_minimum_maximum_ssrgemm_tn_n, 128x64x8_32x32x1_8x4_4x8_4x2) { using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1622,9 +1622,9 @@ TEST(SM50_device_minimum_maximum_ssrgemm_tn_n, 128x128x8_32x64x1_8x8_4x8_4x2) { using WarpShape = cutlass::gemm::GemmShape<32, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = 
typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1658,9 +1658,9 @@ TEST(SM50_device_minimum_maximum_ssrgemm_tn_n, 256x32x8_64x16x1_8x4_8x4_4x2) { using WarpShape = cutlass::gemm::GemmShape<64, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1694,9 +1694,9 @@ TEST(SM50_device_minimum_maximum_ssrgemm_tn_n, 256x64x8_64x32x1_8x8_8x4_4x2) { using WarpShape = cutlass::gemm::GemmShape<64, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1730,9 +1730,9 @@ TEST(SM50_device_minimum_maximum_ssrgemm_tn_n, 32x64x16_8x16x1_2x2_4x8_4x4) { using WarpShape = cutlass::gemm::GemmShape<8, 16, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< 
// - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1766,9 +1766,9 @@ TEST(SM50_device_minimum_maximum_ssrgemm_tn_n, 32x128x16_8x32x1_2x4_4x8_4x4) { using WarpShape = cutlass::gemm::GemmShape<8, 32, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1802,9 +1802,9 @@ TEST(SM50_device_minimum_maximum_ssrgemm_tn_n, 64x32x16_16x8x1_2x2_8x4_4x4) { using WarpShape = cutlass::gemm::GemmShape<16, 8, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1838,9 +1838,9 @@ TEST(SM50_device_minimum_maximum_ssrgemm_tn_n, 64x64x8_16x16x1_4x2_4x8_4x4) { using WarpShape = cutlass::gemm::GemmShape<16, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // 
- cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1874,9 +1874,9 @@ TEST(SM50_device_minimum_maximum_ssrgemm_tn_n, 64x128x8_16x32x1_4x4_4x8_4x4) { using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1910,9 +1910,9 @@ TEST(SM50_device_minimum_maximum_ssrgemm_tn_n, 64x256x8_16x64x1_4x8_4x8_4x4) { using WarpShape = cutlass::gemm::GemmShape<16, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1946,9 +1946,9 @@ TEST(SM50_device_minimum_maximum_ssrgemm_tn_n, 128x32x16_32x8x1_4x2_8x4_4x4) { using WarpShape = cutlass::gemm::GemmShape<32, 8, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config 
= typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1982,9 +1982,9 @@ TEST(SM50_device_minimum_maximum_ssrgemm_tn_n, 128x64x8_32x16x1_4x4_8x4_4x4) { using WarpShape = cutlass::gemm::GemmShape<32, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -2018,9 +2018,9 @@ TEST(SM50_device_minimum_maximum_ssrgemm_tn_n, 128x128x8_32x32x1_8x4_4x8_4x4) { using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -2054,9 +2054,9 @@ TEST(SM50_device_minimum_maximum_ssrgemm_tn_n, 256x64x8_64x16x1_8x4_8x4_4x4) { using WarpShape = cutlass::gemm::GemmShape<64, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename 
cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; diff --git a/test/device/sm50_simt_minimum_maximum_ssrgemm_tn_t.cu b/test/device/sm50_simt_minimum_maximum_ssrgemm_tn_t.cu index 5c3ae16..53c1dd9 100644 --- a/test/device/sm50_simt_minimum_maximum_ssrgemm_tn_t.cu +++ b/test/device/sm50_simt_minimum_maximum_ssrgemm_tn_t.cu @@ -38,9 +38,9 @@ TEST(SM50_device_minimum_maximum_ssrgemm_tn_t, 8x32x8_8x32x1_2x4_4x8_1x1) { using WarpShape = cutlass::gemm::GemmShape<8, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -74,9 +74,9 @@ TEST(SM50_device_minimum_maximum_ssrgemm_tn_t, 16x32x8_16x32x1_4x4_4x8_1x1) { using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -110,9 +110,9 @@ TEST(SM50_device_minimum_maximum_ssrgemm_tn_t, 16x64x8_16x64x1_4x8_4x8_1x1) { using WarpShape = cutlass::gemm::GemmShape<16, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using 
Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -146,9 +146,9 @@ TEST(SM50_device_minimum_maximum_ssrgemm_tn_t, 32x32x8_32x32x1_8x4_4x8_1x1) { using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -182,9 +182,9 @@ TEST(SM50_device_minimum_maximum_ssrgemm_tn_t, 32x64x8_32x64x1_8x8_4x8_1x1) { using WarpShape = cutlass::gemm::GemmShape<32, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -218,9 +218,9 @@ TEST(SM50_device_minimum_maximum_ssrgemm_tn_t, 64x32x8_64x32x1_8x8_8x4_1x1) { using WarpShape = cutlass::gemm::GemmShape<64, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename 
cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -254,9 +254,9 @@ TEST(SM50_device_minimum_maximum_ssrgemm_tn_t, 8x32x8_8x16x1_2x2_4x8_1x2) { using WarpShape = cutlass::gemm::GemmShape<8, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -290,9 +290,9 @@ TEST(SM50_device_minimum_maximum_ssrgemm_tn_t, 8x64x8_8x32x1_2x4_4x8_1x2) { using WarpShape = cutlass::gemm::GemmShape<8, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -326,9 +326,9 @@ TEST(SM50_device_minimum_maximum_ssrgemm_tn_t, 16x32x8_16x16x1_4x2_4x8_1x2) { using WarpShape = cutlass::gemm::GemmShape<16, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, 
precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -362,9 +362,9 @@ TEST(SM50_device_minimum_maximum_ssrgemm_tn_t, 16x64x8_16x32x1_4x4_4x8_1x2) { using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -398,9 +398,9 @@ TEST(SM50_device_minimum_maximum_ssrgemm_tn_t, 16x128x8_16x64x1_4x8_4x8_1x2) { using WarpShape = cutlass::gemm::GemmShape<16, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -434,9 +434,9 @@ TEST(SM50_device_minimum_maximum_ssrgemm_tn_t, 32x32x8_32x16x1_4x4_8x4_1x2) { using WarpShape = cutlass::gemm::GemmShape<32, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, 
cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -470,9 +470,9 @@ TEST(SM50_device_minimum_maximum_ssrgemm_tn_t, 32x64x8_32x32x1_8x4_4x8_1x2) { using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -506,9 +506,9 @@ TEST(SM50_device_minimum_maximum_ssrgemm_tn_t, 32x128x8_32x64x1_8x8_4x8_1x2) { using WarpShape = cutlass::gemm::GemmShape<32, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -542,9 +542,9 @@ TEST(SM50_device_minimum_maximum_ssrgemm_tn_t, 64x64x8_64x32x1_8x8_8x4_1x2) { using WarpShape = cutlass::gemm::GemmShape<64, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename 
cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -578,9 +578,9 @@ TEST(SM50_device_minimum_maximum_ssrgemm_tn_t, 32x32x8_16x32x1_4x4_4x8_2x1) { using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -614,9 +614,9 @@ TEST(SM50_device_minimum_maximum_ssrgemm_tn_t, 64x32x8_32x32x1_8x4_4x8_2x1) { using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -650,9 +650,9 @@ TEST(SM50_device_minimum_maximum_ssrgemm_tn_t, 64x64x8_32x64x1_8x8_4x8_2x1) { using WarpShape = cutlass::gemm::GemmShape<32, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, 
precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -686,9 +686,9 @@ TEST(SM50_device_minimum_maximum_ssrgemm_tn_t, 128x32x8_64x32x1_8x8_8x4_2x1) { using WarpShape = cutlass::gemm::GemmShape<64, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -722,9 +722,9 @@ TEST(SM50_device_minimum_maximum_ssrgemm_tn_t, 16x32x8_8x16x1_2x2_4x8_2x2) { using WarpShape = cutlass::gemm::GemmShape<8, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -758,9 +758,9 @@ TEST(SM50_device_minimum_maximum_ssrgemm_tn_t, 16x64x8_8x32x1_2x4_4x8_2x2) { using WarpShape = cutlass::gemm::GemmShape<8, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, 
OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -794,9 +794,9 @@ TEST(SM50_device_minimum_maximum_ssrgemm_tn_t, 32x32x8_16x16x1_4x2_4x8_2x2) { using WarpShape = cutlass::gemm::GemmShape<16, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -830,9 +830,9 @@ TEST(SM50_device_minimum_maximum_ssrgemm_tn_t, 32x64x8_16x32x1_4x4_4x8_2x2) { using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -866,9 +866,9 @@ TEST(SM50_device_minimum_maximum_ssrgemm_tn_t, 32x128x8_16x64x1_4x8_4x8_2x2) { using WarpShape = cutlass::gemm::GemmShape<16, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = 
Config::MultiplicationOp; @@ -902,9 +902,9 @@ TEST(SM50_device_minimum_maximum_ssrgemm_tn_t, 64x32x8_32x16x1_4x4_8x4_2x2) { using WarpShape = cutlass::gemm::GemmShape<32, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -938,9 +938,9 @@ TEST(SM50_device_minimum_maximum_ssrgemm_tn_t, 64x64x8_32x32x1_8x4_4x8_2x2) { using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -974,9 +974,9 @@ TEST(SM50_device_minimum_maximum_ssrgemm_tn_t, 64x128x8_32x64x1_8x8_4x8_2x2) { using WarpShape = cutlass::gemm::GemmShape<32, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1010,9 +1010,9 @@ 
TEST(SM50_device_minimum_maximum_ssrgemm_tn_t, 128x32x8_64x16x1_8x4_8x4_2x2) { using WarpShape = cutlass::gemm::GemmShape<64, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1046,9 +1046,9 @@ TEST(SM50_device_minimum_maximum_ssrgemm_tn_t, 128x64x8_64x32x1_8x8_8x4_2x2) { using WarpShape = cutlass::gemm::GemmShape<64, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1082,9 +1082,9 @@ TEST(SM50_device_minimum_maximum_ssrgemm_tn_t, 16x64x16_8x16x1_2x2_4x8_2x4) { using WarpShape = cutlass::gemm::GemmShape<8, 16, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1118,9 +1118,9 @@ TEST(SM50_device_minimum_maximum_ssrgemm_tn_t, 
16x128x16_8x32x1_2x4_4x8_2x4) { using WarpShape = cutlass::gemm::GemmShape<8, 32, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1154,9 +1154,9 @@ TEST(SM50_device_minimum_maximum_ssrgemm_tn_t, 32x32x8_16x8x1_2x2_8x4_2x4) { using WarpShape = cutlass::gemm::GemmShape<16, 8, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1190,9 +1190,9 @@ TEST(SM50_device_minimum_maximum_ssrgemm_tn_t, 32x64x8_16x16x1_4x2_4x8_2x4) { using WarpShape = cutlass::gemm::GemmShape<16, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1226,9 +1226,9 @@ TEST(SM50_device_minimum_maximum_ssrgemm_tn_t, 32x128x8_16x32x1_4x4_4x8_2x4) { using WarpShape = 
cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1262,9 +1262,9 @@ TEST(SM50_device_minimum_maximum_ssrgemm_tn_t, 32x256x8_16x64x1_4x8_4x8_2x4) { using WarpShape = cutlass::gemm::GemmShape<16, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1298,9 +1298,9 @@ TEST(SM50_device_minimum_maximum_ssrgemm_tn_t, 64x64x8_32x16x1_4x4_8x4_2x4) { using WarpShape = cutlass::gemm::GemmShape<32, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1334,9 +1334,9 @@ TEST(SM50_device_minimum_maximum_ssrgemm_tn_t, 64x128x8_32x32x1_8x4_4x8_2x4) { using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape 
= cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1370,9 +1370,9 @@ TEST(SM50_device_minimum_maximum_ssrgemm_tn_t, 64x256x8_32x64x1_8x8_4x8_2x4) { using WarpShape = cutlass::gemm::GemmShape<32, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1406,9 +1406,9 @@ TEST(SM50_device_minimum_maximum_ssrgemm_tn_t, 128x128x8_64x32x1_8x8_8x4_2x4) { using WarpShape = cutlass::gemm::GemmShape<64, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1442,9 +1442,9 @@ TEST(SM50_device_minimum_maximum_ssrgemm_tn_t, 32x32x8_8x16x1_2x2_4x8_4x2) { using WarpShape = cutlass::gemm::GemmShape<8, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = 
typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1478,9 +1478,9 @@ TEST(SM50_device_minimum_maximum_ssrgemm_tn_t, 64x32x8_16x16x1_4x2_4x8_4x2) { using WarpShape = cutlass::gemm::GemmShape<16, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1514,9 +1514,9 @@ TEST(SM50_device_minimum_maximum_ssrgemm_tn_t, 64x64x8_16x32x1_4x4_4x8_4x2) { using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1550,9 +1550,9 @@ TEST(SM50_device_minimum_maximum_ssrgemm_tn_t, 128x32x8_32x16x1_4x4_8x4_4x2) { using WarpShape = cutlass::gemm::GemmShape<32, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< 
// - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1586,9 +1586,9 @@ TEST(SM50_device_minimum_maximum_ssrgemm_tn_t, 128x64x8_32x32x1_8x4_4x8_4x2) { using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1622,9 +1622,9 @@ TEST(SM50_device_minimum_maximum_ssrgemm_tn_t, 128x128x8_32x64x1_8x8_4x8_4x2) { using WarpShape = cutlass::gemm::GemmShape<32, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1658,9 +1658,9 @@ TEST(SM50_device_minimum_maximum_ssrgemm_tn_t, 256x32x8_64x16x1_8x4_8x4_4x2) { using WarpShape = cutlass::gemm::GemmShape<64, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, 
// - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1694,9 +1694,9 @@ TEST(SM50_device_minimum_maximum_ssrgemm_tn_t, 256x64x8_64x32x1_8x8_8x4_4x2) { using WarpShape = cutlass::gemm::GemmShape<64, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1730,9 +1730,9 @@ TEST(SM50_device_minimum_maximum_ssrgemm_tn_t, 32x64x16_8x16x1_2x2_4x8_4x4) { using WarpShape = cutlass::gemm::GemmShape<8, 16, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1766,9 +1766,9 @@ TEST(SM50_device_minimum_maximum_ssrgemm_tn_t, 32x128x16_8x32x1_2x4_4x8_4x4) { using WarpShape = cutlass::gemm::GemmShape<8, 32, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using 
Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1802,9 +1802,9 @@ TEST(SM50_device_minimum_maximum_ssrgemm_tn_t, 64x32x16_16x8x1_2x2_8x4_4x4) { using WarpShape = cutlass::gemm::GemmShape<16, 8, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1838,9 +1838,9 @@ TEST(SM50_device_minimum_maximum_ssrgemm_tn_t, 64x64x8_16x16x1_4x2_4x8_4x4) { using WarpShape = cutlass::gemm::GemmShape<16, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1874,9 +1874,9 @@ TEST(SM50_device_minimum_maximum_ssrgemm_tn_t, 64x128x8_16x32x1_4x4_4x8_4x4) { using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename 
cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1910,9 +1910,9 @@ TEST(SM50_device_minimum_maximum_ssrgemm_tn_t, 64x256x8_16x64x1_4x8_4x8_4x4) { using WarpShape = cutlass::gemm::GemmShape<16, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1946,9 +1946,9 @@ TEST(SM50_device_minimum_maximum_ssrgemm_tn_t, 128x32x16_32x8x1_4x2_8x4_4x4) { using WarpShape = cutlass::gemm::GemmShape<32, 8, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1982,9 +1982,9 @@ TEST(SM50_device_minimum_maximum_ssrgemm_tn_t, 128x64x8_32x16x1_4x4_8x4_4x4) { using WarpShape = cutlass::gemm::GemmShape<32, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + 
precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -2018,9 +2018,9 @@ TEST(SM50_device_minimum_maximum_ssrgemm_tn_t, 128x128x8_32x32x1_8x4_4x8_4x4) { using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -2054,9 +2054,9 @@ TEST(SM50_device_minimum_maximum_ssrgemm_tn_t, 256x64x8_64x16x1_8x4_8x4_4x4) { using WarpShape = cutlass::gemm::GemmShape<64, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; diff --git a/test/device/sm50_simt_minimum_maximum_ssrgemm_tt_n.cu b/test/device/sm50_simt_minimum_maximum_ssrgemm_tt_n.cu index 2184d53..e419ad3 100644 --- a/test/device/sm50_simt_minimum_maximum_ssrgemm_tt_n.cu +++ b/test/device/sm50_simt_minimum_maximum_ssrgemm_tt_n.cu @@ -38,9 +38,9 @@ TEST(SM50_device_minimum_maximum_ssrgemm_tt_n, 8x32x8_8x32x1_2x4_4x8_1x1) { using WarpShape = cutlass::gemm::GemmShape<8, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename 
cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -74,9 +74,9 @@ TEST(SM50_device_minimum_maximum_ssrgemm_tt_n, 16x32x8_16x32x1_4x4_4x8_1x1) { using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -110,9 +110,9 @@ TEST(SM50_device_minimum_maximum_ssrgemm_tt_n, 16x64x8_16x64x1_4x8_4x8_1x1) { using WarpShape = cutlass::gemm::GemmShape<16, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -146,9 +146,9 @@ TEST(SM50_device_minimum_maximum_ssrgemm_tt_n, 32x32x8_32x32x1_8x4_4x8_1x1) { using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, 
precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -182,9 +182,9 @@ TEST(SM50_device_minimum_maximum_ssrgemm_tt_n, 32x64x8_32x64x1_8x8_4x8_1x1) { using WarpShape = cutlass::gemm::GemmShape<32, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -218,9 +218,9 @@ TEST(SM50_device_minimum_maximum_ssrgemm_tt_n, 64x32x8_64x32x1_8x8_8x4_1x1) { using WarpShape = cutlass::gemm::GemmShape<64, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -254,9 +254,9 @@ TEST(SM50_device_minimum_maximum_ssrgemm_tt_n, 8x32x8_8x16x1_2x2_4x8_1x2) { using WarpShape = cutlass::gemm::GemmShape<8, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, 
cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -290,9 +290,9 @@ TEST(SM50_device_minimum_maximum_ssrgemm_tt_n, 8x64x8_8x32x1_2x4_4x8_1x2) { using WarpShape = cutlass::gemm::GemmShape<8, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -326,9 +326,9 @@ TEST(SM50_device_minimum_maximum_ssrgemm_tt_n, 16x32x8_16x16x1_4x2_4x8_1x2) { using WarpShape = cutlass::gemm::GemmShape<16, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -362,9 +362,9 @@ TEST(SM50_device_minimum_maximum_ssrgemm_tt_n, 16x64x8_16x32x1_4x4_4x8_1x2) { using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename 
cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -398,9 +398,9 @@ TEST(SM50_device_minimum_maximum_ssrgemm_tt_n, 16x128x8_16x64x1_4x8_4x8_1x2) { using WarpShape = cutlass::gemm::GemmShape<16, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -434,9 +434,9 @@ TEST(SM50_device_minimum_maximum_ssrgemm_tt_n, 32x32x8_32x16x1_4x4_8x4_1x2) { using WarpShape = cutlass::gemm::GemmShape<32, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -470,9 +470,9 @@ TEST(SM50_device_minimum_maximum_ssrgemm_tt_n, 32x64x8_32x32x1_8x4_4x8_1x2) { using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, 
precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -506,9 +506,9 @@ TEST(SM50_device_minimum_maximum_ssrgemm_tt_n, 32x128x8_32x64x1_8x8_4x8_1x2) { using WarpShape = cutlass::gemm::GemmShape<32, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -542,9 +542,9 @@ TEST(SM50_device_minimum_maximum_ssrgemm_tt_n, 64x64x8_64x32x1_8x8_8x4_1x2) { using WarpShape = cutlass::gemm::GemmShape<64, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -578,9 +578,9 @@ TEST(SM50_device_minimum_maximum_ssrgemm_tt_n, 32x32x8_16x32x1_4x4_4x8_2x1) { using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, 
OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -614,9 +614,9 @@ TEST(SM50_device_minimum_maximum_ssrgemm_tt_n, 64x32x8_32x32x1_8x4_4x8_2x1) { using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -650,9 +650,9 @@ TEST(SM50_device_minimum_maximum_ssrgemm_tt_n, 64x64x8_32x64x1_8x8_4x8_2x1) { using WarpShape = cutlass::gemm::GemmShape<32, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -686,9 +686,9 @@ TEST(SM50_device_minimum_maximum_ssrgemm_tt_n, 128x32x8_64x32x1_8x8_8x4_2x1) { using WarpShape = cutlass::gemm::GemmShape<64, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = 
Config::MultiplicationOp; @@ -722,9 +722,9 @@ TEST(SM50_device_minimum_maximum_ssrgemm_tt_n, 16x32x8_8x16x1_2x2_4x8_2x2) { using WarpShape = cutlass::gemm::GemmShape<8, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -758,9 +758,9 @@ TEST(SM50_device_minimum_maximum_ssrgemm_tt_n, 16x64x8_8x32x1_2x4_4x8_2x2) { using WarpShape = cutlass::gemm::GemmShape<8, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -794,9 +794,9 @@ TEST(SM50_device_minimum_maximum_ssrgemm_tt_n, 32x32x8_16x16x1_4x2_4x8_2x2) { using WarpShape = cutlass::gemm::GemmShape<16, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -830,9 +830,9 @@ 
TEST(SM50_device_minimum_maximum_ssrgemm_tt_n, 32x64x8_16x32x1_4x4_4x8_2x2) { using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -866,9 +866,9 @@ TEST(SM50_device_minimum_maximum_ssrgemm_tt_n, 32x128x8_16x64x1_4x8_4x8_2x2) { using WarpShape = cutlass::gemm::GemmShape<16, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -902,9 +902,9 @@ TEST(SM50_device_minimum_maximum_ssrgemm_tt_n, 64x32x8_32x16x1_4x4_8x4_2x2) { using WarpShape = cutlass::gemm::GemmShape<32, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -938,9 +938,9 @@ TEST(SM50_device_minimum_maximum_ssrgemm_tt_n, 
64x64x8_32x32x1_8x4_4x8_2x2) { using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -974,9 +974,9 @@ TEST(SM50_device_minimum_maximum_ssrgemm_tt_n, 64x128x8_32x64x1_8x8_4x8_2x2) { using WarpShape = cutlass::gemm::GemmShape<32, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1010,9 +1010,9 @@ TEST(SM50_device_minimum_maximum_ssrgemm_tt_n, 128x32x8_64x16x1_8x4_8x4_2x2) { using WarpShape = cutlass::gemm::GemmShape<64, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1046,9 +1046,9 @@ TEST(SM50_device_minimum_maximum_ssrgemm_tt_n, 128x64x8_64x32x1_8x8_8x4_2x2) { using WarpShape = 
cutlass::gemm::GemmShape<64, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1082,9 +1082,9 @@ TEST(SM50_device_minimum_maximum_ssrgemm_tt_n, 16x64x16_8x16x1_2x2_4x8_2x4) { using WarpShape = cutlass::gemm::GemmShape<8, 16, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1118,9 +1118,9 @@ TEST(SM50_device_minimum_maximum_ssrgemm_tt_n, 16x128x16_8x32x1_2x4_4x8_2x4) { using WarpShape = cutlass::gemm::GemmShape<8, 32, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1154,9 +1154,9 @@ TEST(SM50_device_minimum_maximum_ssrgemm_tt_n, 32x32x8_16x8x1_2x2_8x4_2x4) { using WarpShape = cutlass::gemm::GemmShape<16, 8, 8>; using InstructionShape = 
cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1190,9 +1190,9 @@ TEST(SM50_device_minimum_maximum_ssrgemm_tt_n, 32x64x8_16x16x1_4x2_4x8_2x4) { using WarpShape = cutlass::gemm::GemmShape<16, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1226,9 +1226,9 @@ TEST(SM50_device_minimum_maximum_ssrgemm_tt_n, 32x128x8_16x32x1_4x4_4x8_2x4) { using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1262,9 +1262,9 @@ TEST(SM50_device_minimum_maximum_ssrgemm_tt_n, 32x256x8_16x64x1_4x8_4x8_2x4) { using WarpShape = cutlass::gemm::GemmShape<16, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = 
typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1298,9 +1298,9 @@ TEST(SM50_device_minimum_maximum_ssrgemm_tt_n, 64x64x8_32x16x1_4x4_8x4_2x4) { using WarpShape = cutlass::gemm::GemmShape<32, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1334,9 +1334,9 @@ TEST(SM50_device_minimum_maximum_ssrgemm_tt_n, 64x128x8_32x32x1_8x4_4x8_2x4) { using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1370,9 +1370,9 @@ TEST(SM50_device_minimum_maximum_ssrgemm_tt_n, 64x256x8_32x64x1_8x8_4x8_2x4) { using WarpShape = cutlass::gemm::GemmShape<32, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< 
// - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1406,9 +1406,9 @@ TEST(SM50_device_minimum_maximum_ssrgemm_tt_n, 128x128x8_64x32x1_8x8_8x4_2x4) { using WarpShape = cutlass::gemm::GemmShape<64, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1442,9 +1442,9 @@ TEST(SM50_device_minimum_maximum_ssrgemm_tt_n, 32x32x8_8x16x1_2x2_4x8_4x2) { using WarpShape = cutlass::gemm::GemmShape<8, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1478,9 +1478,9 @@ TEST(SM50_device_minimum_maximum_ssrgemm_tt_n, 64x32x8_16x16x1_4x2_4x8_4x2) { using WarpShape = cutlass::gemm::GemmShape<16, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // 
- cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1514,9 +1514,9 @@ TEST(SM50_device_minimum_maximum_ssrgemm_tt_n, 64x64x8_16x32x1_4x4_4x8_4x2) { using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1550,9 +1550,9 @@ TEST(SM50_device_minimum_maximum_ssrgemm_tt_n, 128x32x8_32x16x1_4x4_8x4_4x2) { using WarpShape = cutlass::gemm::GemmShape<32, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1586,9 +1586,9 @@ TEST(SM50_device_minimum_maximum_ssrgemm_tt_n, 128x64x8_32x32x1_8x4_4x8_4x2) { using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = 
typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1622,9 +1622,9 @@ TEST(SM50_device_minimum_maximum_ssrgemm_tt_n, 128x128x8_32x64x1_8x8_4x8_4x2) { using WarpShape = cutlass::gemm::GemmShape<32, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1658,9 +1658,9 @@ TEST(SM50_device_minimum_maximum_ssrgemm_tt_n, 256x32x8_64x16x1_8x4_8x4_4x2) { using WarpShape = cutlass::gemm::GemmShape<64, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1694,9 +1694,9 @@ TEST(SM50_device_minimum_maximum_ssrgemm_tt_n, 256x64x8_64x32x1_8x8_8x4_4x2) { using WarpShape = cutlass::gemm::GemmShape<64, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename 
cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1730,9 +1730,9 @@ TEST(SM50_device_minimum_maximum_ssrgemm_tt_n, 32x64x16_8x16x1_2x2_4x8_4x4) { using WarpShape = cutlass::gemm::GemmShape<8, 16, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1766,9 +1766,9 @@ TEST(SM50_device_minimum_maximum_ssrgemm_tt_n, 32x128x16_8x32x1_2x4_4x8_4x4) { using WarpShape = cutlass::gemm::GemmShape<8, 32, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1802,9 +1802,9 @@ TEST(SM50_device_minimum_maximum_ssrgemm_tt_n, 64x32x16_16x8x1_2x2_8x4_4x4) { using WarpShape = cutlass::gemm::GemmShape<16, 8, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + 
precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1838,9 +1838,9 @@ TEST(SM50_device_minimum_maximum_ssrgemm_tt_n, 64x64x8_16x16x1_4x2_4x8_4x4) { using WarpShape = cutlass::gemm::GemmShape<16, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1874,9 +1874,9 @@ TEST(SM50_device_minimum_maximum_ssrgemm_tt_n, 64x128x8_16x32x1_4x4_4x8_4x4) { using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1910,9 +1910,9 @@ TEST(SM50_device_minimum_maximum_ssrgemm_tt_n, 64x256x8_16x64x1_4x8_4x8_4x4) { using WarpShape = cutlass::gemm::GemmShape<16, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + 
cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1946,9 +1946,9 @@ TEST(SM50_device_minimum_maximum_ssrgemm_tt_n, 128x32x16_32x8x1_4x2_8x4_4x4) { using WarpShape = cutlass::gemm::GemmShape<32, 8, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1982,9 +1982,9 @@ TEST(SM50_device_minimum_maximum_ssrgemm_tt_n, 128x64x8_32x16x1_4x4_8x4_4x4) { using WarpShape = cutlass::gemm::GemmShape<32, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -2018,9 +2018,9 @@ TEST(SM50_device_minimum_maximum_ssrgemm_tt_n, 128x128x8_32x32x1_8x4_4x8_4x4) { using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using 
AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -2054,9 +2054,9 @@ TEST(SM50_device_minimum_maximum_ssrgemm_tt_n, 256x64x8_64x16x1_8x4_8x4_4x4) { using WarpShape = cutlass::gemm::GemmShape<64, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; diff --git a/test/device/sm50_simt_minimum_maximum_ssrgemm_tt_t.cu b/test/device/sm50_simt_minimum_maximum_ssrgemm_tt_t.cu index af191f7..2c69297 100644 --- a/test/device/sm50_simt_minimum_maximum_ssrgemm_tt_t.cu +++ b/test/device/sm50_simt_minimum_maximum_ssrgemm_tt_t.cu @@ -38,9 +38,9 @@ TEST(SM50_device_minimum_maximum_ssrgemm_tt_t, 8x32x8_8x32x1_2x4_4x8_1x1) { using WarpShape = cutlass::gemm::GemmShape<8, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -74,9 +74,9 @@ TEST(SM50_device_minimum_maximum_ssrgemm_tt_t, 16x32x8_16x32x1_4x4_4x8_1x1) { using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, 
cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -110,9 +110,9 @@ TEST(SM50_device_minimum_maximum_ssrgemm_tt_t, 16x64x8_16x64x1_4x8_4x8_1x1) { using WarpShape = cutlass::gemm::GemmShape<16, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -146,9 +146,9 @@ TEST(SM50_device_minimum_maximum_ssrgemm_tt_t, 32x32x8_32x32x1_8x4_4x8_1x1) { using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -182,9 +182,9 @@ TEST(SM50_device_minimum_maximum_ssrgemm_tt_t, 32x64x8_32x64x1_8x8_4x8_1x1) { using WarpShape = cutlass::gemm::GemmShape<32, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename 
cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -218,9 +218,9 @@ TEST(SM50_device_minimum_maximum_ssrgemm_tt_t, 64x32x8_64x32x1_8x8_8x4_1x1) { using WarpShape = cutlass::gemm::GemmShape<64, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -254,9 +254,9 @@ TEST(SM50_device_minimum_maximum_ssrgemm_tt_t, 8x32x8_8x16x1_2x2_4x8_1x2) { using WarpShape = cutlass::gemm::GemmShape<8, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -290,9 +290,9 @@ TEST(SM50_device_minimum_maximum_ssrgemm_tt_t, 8x64x8_8x32x1_2x4_4x8_1x2) { using WarpShape = cutlass::gemm::GemmShape<8, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, 
precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -326,9 +326,9 @@ TEST(SM50_device_minimum_maximum_ssrgemm_tt_t, 16x32x8_16x16x1_4x2_4x8_1x2) { using WarpShape = cutlass::gemm::GemmShape<16, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -362,9 +362,9 @@ TEST(SM50_device_minimum_maximum_ssrgemm_tt_t, 16x64x8_16x32x1_4x4_4x8_1x2) { using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -398,9 +398,9 @@ TEST(SM50_device_minimum_maximum_ssrgemm_tt_t, 16x128x8_16x64x1_4x8_4x8_1x2) { using WarpShape = cutlass::gemm::GemmShape<16, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, 
OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -434,9 +434,9 @@ TEST(SM50_device_minimum_maximum_ssrgemm_tt_t, 32x32x8_32x16x1_4x4_8x4_1x2) { using WarpShape = cutlass::gemm::GemmShape<32, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -470,9 +470,9 @@ TEST(SM50_device_minimum_maximum_ssrgemm_tt_t, 32x64x8_32x32x1_8x4_4x8_1x2) { using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -506,9 +506,9 @@ TEST(SM50_device_minimum_maximum_ssrgemm_tt_t, 32x128x8_32x64x1_8x8_4x8_1x2) { using WarpShape = cutlass::gemm::GemmShape<32, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = 
Config::MultiplicationOp; @@ -542,9 +542,9 @@ TEST(SM50_device_minimum_maximum_ssrgemm_tt_t, 64x64x8_64x32x1_8x8_8x4_1x2) { using WarpShape = cutlass::gemm::GemmShape<64, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -578,9 +578,9 @@ TEST(SM50_device_minimum_maximum_ssrgemm_tt_t, 32x32x8_16x32x1_4x4_4x8_2x1) { using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -614,9 +614,9 @@ TEST(SM50_device_minimum_maximum_ssrgemm_tt_t, 64x32x8_32x32x1_8x4_4x8_2x1) { using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -650,9 +650,9 @@ 
TEST(SM50_device_minimum_maximum_ssrgemm_tt_t, 64x64x8_32x64x1_8x8_4x8_2x1) { using WarpShape = cutlass::gemm::GemmShape<32, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -686,9 +686,9 @@ TEST(SM50_device_minimum_maximum_ssrgemm_tt_t, 128x32x8_64x32x1_8x8_8x4_2x1) { using WarpShape = cutlass::gemm::GemmShape<64, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -722,9 +722,9 @@ TEST(SM50_device_minimum_maximum_ssrgemm_tt_t, 16x32x8_8x16x1_2x2_4x8_2x2) { using WarpShape = cutlass::gemm::GemmShape<8, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -758,9 +758,9 @@ TEST(SM50_device_minimum_maximum_ssrgemm_tt_t, 
16x64x8_8x32x1_2x4_4x8_2x2) { using WarpShape = cutlass::gemm::GemmShape<8, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -794,9 +794,9 @@ TEST(SM50_device_minimum_maximum_ssrgemm_tt_t, 32x32x8_16x16x1_4x2_4x8_2x2) { using WarpShape = cutlass::gemm::GemmShape<16, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -830,9 +830,9 @@ TEST(SM50_device_minimum_maximum_ssrgemm_tt_t, 32x64x8_16x32x1_4x4_4x8_2x2) { using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -866,9 +866,9 @@ TEST(SM50_device_minimum_maximum_ssrgemm_tt_t, 32x128x8_16x64x1_4x8_4x8_2x2) { using WarpShape = 
cutlass::gemm::GemmShape<16, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -902,9 +902,9 @@ TEST(SM50_device_minimum_maximum_ssrgemm_tt_t, 64x32x8_32x16x1_4x4_8x4_2x2) { using WarpShape = cutlass::gemm::GemmShape<32, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -938,9 +938,9 @@ TEST(SM50_device_minimum_maximum_ssrgemm_tt_t, 64x64x8_32x32x1_8x4_4x8_2x2) { using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -974,9 +974,9 @@ TEST(SM50_device_minimum_maximum_ssrgemm_tt_t, 64x128x8_32x64x1_8x8_4x8_2x2) { using WarpShape = cutlass::gemm::GemmShape<32, 64, 8>; using InstructionShape = 
cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1010,9 +1010,9 @@ TEST(SM50_device_minimum_maximum_ssrgemm_tt_t, 128x32x8_64x16x1_8x4_8x4_2x2) { using WarpShape = cutlass::gemm::GemmShape<64, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1046,9 +1046,9 @@ TEST(SM50_device_minimum_maximum_ssrgemm_tt_t, 128x64x8_64x32x1_8x8_8x4_2x2) { using WarpShape = cutlass::gemm::GemmShape<64, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1082,9 +1082,9 @@ TEST(SM50_device_minimum_maximum_ssrgemm_tt_t, 16x64x16_8x16x1_2x2_4x8_2x4) { using WarpShape = cutlass::gemm::GemmShape<8, 16, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = 
typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1118,9 +1118,9 @@ TEST(SM50_device_minimum_maximum_ssrgemm_tt_t, 16x128x16_8x32x1_2x4_4x8_2x4) { using WarpShape = cutlass::gemm::GemmShape<8, 32, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1154,9 +1154,9 @@ TEST(SM50_device_minimum_maximum_ssrgemm_tt_t, 32x32x8_16x8x1_2x2_8x4_2x4) { using WarpShape = cutlass::gemm::GemmShape<16, 8, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1190,9 +1190,9 @@ TEST(SM50_device_minimum_maximum_ssrgemm_tt_t, 32x64x8_16x16x1_4x2_4x8_2x4) { using WarpShape = cutlass::gemm::GemmShape<16, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // 
- precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1226,9 +1226,9 @@ TEST(SM50_device_minimum_maximum_ssrgemm_tt_t, 32x128x8_16x32x1_4x4_4x8_2x4) { using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1262,9 +1262,9 @@ TEST(SM50_device_minimum_maximum_ssrgemm_tt_t, 32x256x8_16x64x1_4x8_4x8_2x4) { using WarpShape = cutlass::gemm::GemmShape<16, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1298,9 +1298,9 @@ TEST(SM50_device_minimum_maximum_ssrgemm_tt_t, 64x64x8_32x16x1_4x4_8x4_2x4) { using WarpShape = cutlass::gemm::GemmShape<32, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - 
cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1334,9 +1334,9 @@ TEST(SM50_device_minimum_maximum_ssrgemm_tt_t, 64x128x8_32x32x1_8x4_4x8_2x4) { using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1370,9 +1370,9 @@ TEST(SM50_device_minimum_maximum_ssrgemm_tt_t, 64x256x8_32x64x1_8x8_4x8_2x4) { using WarpShape = cutlass::gemm::GemmShape<32, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1406,9 +1406,9 @@ TEST(SM50_device_minimum_maximum_ssrgemm_tt_t, 128x128x8_64x32x1_8x8_8x4_2x4) { using WarpShape = cutlass::gemm::GemmShape<64, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = 
typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1442,9 +1442,9 @@ TEST(SM50_device_minimum_maximum_ssrgemm_tt_t, 32x32x8_8x16x1_2x2_4x8_4x2) { using WarpShape = cutlass::gemm::GemmShape<8, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1478,9 +1478,9 @@ TEST(SM50_device_minimum_maximum_ssrgemm_tt_t, 64x32x8_16x16x1_4x2_4x8_4x2) { using WarpShape = cutlass::gemm::GemmShape<16, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1514,9 +1514,9 @@ TEST(SM50_device_minimum_maximum_ssrgemm_tt_t, 64x64x8_16x32x1_4x4_4x8_4x2) { using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + 
precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1550,9 +1550,9 @@ TEST(SM50_device_minimum_maximum_ssrgemm_tt_t, 128x32x8_32x16x1_4x4_8x4_4x2) { using WarpShape = cutlass::gemm::GemmShape<32, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1586,9 +1586,9 @@ TEST(SM50_device_minimum_maximum_ssrgemm_tt_t, 128x64x8_32x32x1_8x4_4x8_4x2) { using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1622,9 +1622,9 @@ TEST(SM50_device_minimum_maximum_ssrgemm_tt_t, 128x128x8_32x64x1_8x8_4x8_4x2) { using WarpShape = cutlass::gemm::GemmShape<32, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + 
cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1658,9 +1658,9 @@ TEST(SM50_device_minimum_maximum_ssrgemm_tt_t, 256x32x8_64x16x1_8x4_8x4_4x2) { using WarpShape = cutlass::gemm::GemmShape<64, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1694,9 +1694,9 @@ TEST(SM50_device_minimum_maximum_ssrgemm_tt_t, 256x64x8_64x32x1_8x8_8x4_4x2) { using WarpShape = cutlass::gemm::GemmShape<64, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1730,9 +1730,9 @@ TEST(SM50_device_minimum_maximum_ssrgemm_tt_t, 32x64x16_8x16x1_2x2_4x8_4x4) { using WarpShape = cutlass::gemm::GemmShape<8, 16, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using 
AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1766,9 +1766,9 @@ TEST(SM50_device_minimum_maximum_ssrgemm_tt_t, 32x128x16_8x32x1_2x4_4x8_4x4) { using WarpShape = cutlass::gemm::GemmShape<8, 32, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1802,9 +1802,9 @@ TEST(SM50_device_minimum_maximum_ssrgemm_tt_t, 64x32x16_16x8x1_2x2_8x4_4x4) { using WarpShape = cutlass::gemm::GemmShape<16, 8, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1838,9 +1838,9 @@ TEST(SM50_device_minimum_maximum_ssrgemm_tt_t, 64x64x8_16x16x1_4x2_4x8_4x4) { using WarpShape = cutlass::gemm::GemmShape<16, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = 
Config::MultiplicationOp; @@ -1874,9 +1874,9 @@ TEST(SM50_device_minimum_maximum_ssrgemm_tt_t, 64x128x8_16x32x1_4x4_4x8_4x4) { using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1910,9 +1910,9 @@ TEST(SM50_device_minimum_maximum_ssrgemm_tt_t, 64x256x8_16x64x1_4x8_4x8_4x4) { using WarpShape = cutlass::gemm::GemmShape<16, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1946,9 +1946,9 @@ TEST(SM50_device_minimum_maximum_ssrgemm_tt_t, 128x32x16_32x8x1_4x2_8x4_4x4) { using WarpShape = cutlass::gemm::GemmShape<32, 8, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1982,9 +1982,9 @@ 
TEST(SM50_device_minimum_maximum_ssrgemm_tt_t, 128x64x8_32x16x1_4x4_8x4_4x4) { using WarpShape = cutlass::gemm::GemmShape<32, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -2018,9 +2018,9 @@ TEST(SM50_device_minimum_maximum_ssrgemm_tt_t, 128x128x8_32x32x1_8x4_4x8_4x4) { using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -2054,9 +2054,9 @@ TEST(SM50_device_minimum_maximum_ssrgemm_tt_t, 256x64x8_64x16x1_8x4_8x4_4x4) { using WarpShape = cutlass::gemm::GemmShape<64, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::maximum, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::maximum, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; diff --git a/test/device/sm50_simt_minimum_multiplies_dsrgemm_nn_n.cu 
b/test/device/sm50_simt_minimum_multiplies_dsrgemm_nn_n.cu index 79d645d..7694186 100644 --- a/test/device/sm50_simt_minimum_multiplies_dsrgemm_nn_n.cu +++ b/test/device/sm50_simt_minimum_multiplies_dsrgemm_nn_n.cu @@ -38,9 +38,9 @@ TEST(SM50_device_minimum_multiplies_dsrgemm_nn_n, 8x32x8_8x32x1_2x4_4x8_1x1) { using WarpShape = cutlass::gemm::GemmShape<8, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -74,9 +74,9 @@ TEST(SM50_device_minimum_multiplies_dsrgemm_nn_n, 16x32x8_16x32x1_4x4_4x8_1x1) { using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -110,9 +110,9 @@ TEST(SM50_device_minimum_multiplies_dsrgemm_nn_n, 16x64x8_16x64x1_4x8_4x8_1x1) { using WarpShape = cutlass::gemm::GemmShape<16, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + 
precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -146,9 +146,9 @@ TEST(SM50_device_minimum_multiplies_dsrgemm_nn_n, 32x32x8_32x32x1_8x4_4x8_1x1) { using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -182,9 +182,9 @@ TEST(SM50_device_minimum_multiplies_dsrgemm_nn_n, 8x32x8_8x16x1_2x2_4x8_1x2) { using WarpShape = cutlass::gemm::GemmShape<8, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -218,9 +218,9 @@ TEST(SM50_device_minimum_multiplies_dsrgemm_nn_n, 8x64x8_8x32x1_2x4_4x8_1x2) { using WarpShape = cutlass::gemm::GemmShape<8, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + 
cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -254,9 +254,9 @@ TEST(SM50_device_minimum_multiplies_dsrgemm_nn_n, 16x32x8_16x16x1_4x2_4x8_1x2) { using WarpShape = cutlass::gemm::GemmShape<16, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -290,9 +290,9 @@ TEST(SM50_device_minimum_multiplies_dsrgemm_nn_n, 16x64x8_16x32x1_4x4_4x8_1x2) { using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -326,9 +326,9 @@ TEST(SM50_device_minimum_multiplies_dsrgemm_nn_n, 16x128x8_16x64x1_4x8_4x8_1x2) using WarpShape = cutlass::gemm::GemmShape<16, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, 
OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -362,9 +362,9 @@ TEST(SM50_device_minimum_multiplies_dsrgemm_nn_n, 32x32x8_32x16x1_4x4_8x4_1x2) { using WarpShape = cutlass::gemm::GemmShape<32, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -398,9 +398,9 @@ TEST(SM50_device_minimum_multiplies_dsrgemm_nn_n, 32x64x8_32x32x1_8x4_4x8_1x2) { using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -434,9 +434,9 @@ TEST(SM50_device_minimum_multiplies_dsrgemm_nn_n, 32x32x8_16x32x1_4x4_4x8_2x1) { using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = 
Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -470,9 +470,9 @@ TEST(SM50_device_minimum_multiplies_dsrgemm_nn_n, 64x32x8_32x32x1_8x4_4x8_2x1) { using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -506,9 +506,9 @@ TEST(SM50_device_minimum_multiplies_dsrgemm_nn_n, 16x32x8_8x16x1_2x2_4x8_2x2) { using WarpShape = cutlass::gemm::GemmShape<8, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -542,9 +542,9 @@ TEST(SM50_device_minimum_multiplies_dsrgemm_nn_n, 16x64x8_8x32x1_2x4_4x8_2x2) { using WarpShape = cutlass::gemm::GemmShape<8, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = 
Config::MultiplicationOp; @@ -578,9 +578,9 @@ TEST(SM50_device_minimum_multiplies_dsrgemm_nn_n, 32x32x8_16x16x1_4x2_4x8_2x2) { using WarpShape = cutlass::gemm::GemmShape<16, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -614,9 +614,9 @@ TEST(SM50_device_minimum_multiplies_dsrgemm_nn_n, 32x64x8_16x32x1_4x4_4x8_2x2) { using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -650,9 +650,9 @@ TEST(SM50_device_minimum_multiplies_dsrgemm_nn_n, 32x128x8_16x64x1_4x8_4x8_2x2) using WarpShape = cutlass::gemm::GemmShape<16, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -686,9 
+686,9 @@ TEST(SM50_device_minimum_multiplies_dsrgemm_nn_n, 64x32x8_32x16x1_4x4_8x4_2x2) { using WarpShape = cutlass::gemm::GemmShape<32, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -722,9 +722,9 @@ TEST(SM50_device_minimum_multiplies_dsrgemm_nn_n, 64x64x8_32x32x1_8x4_4x8_2x2) { using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -758,9 +758,9 @@ TEST(SM50_device_minimum_multiplies_dsrgemm_nn_n, 128x32x8_64x16x1_8x4_8x4_2x2) using WarpShape = cutlass::gemm::GemmShape<64, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -794,9 +794,9 @@ 
TEST(SM50_device_minimum_multiplies_dsrgemm_nn_n, 16x64x16_8x16x1_2x2_4x8_2x4) { using WarpShape = cutlass::gemm::GemmShape<8, 16, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -830,9 +830,9 @@ TEST(SM50_device_minimum_multiplies_dsrgemm_nn_n, 16x128x16_8x32x1_2x4_4x8_2x4) using WarpShape = cutlass::gemm::GemmShape<8, 32, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -866,9 +866,9 @@ TEST(SM50_device_minimum_multiplies_dsrgemm_nn_n, 32x32x8_16x8x1_2x2_8x4_2x4) { using WarpShape = cutlass::gemm::GemmShape<16, 8, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -902,9 +902,9 @@ 
TEST(SM50_device_minimum_multiplies_dsrgemm_nn_n, 32x64x8_16x16x1_4x2_4x8_2x4) { using WarpShape = cutlass::gemm::GemmShape<16, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -938,9 +938,9 @@ TEST(SM50_device_minimum_multiplies_dsrgemm_nn_n, 32x128x8_16x32x1_4x4_4x8_2x4) using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -974,9 +974,9 @@ TEST(SM50_device_minimum_multiplies_dsrgemm_nn_n, 64x64x8_32x16x1_4x4_8x4_2x4) { using WarpShape = cutlass::gemm::GemmShape<32, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1010,9 +1010,9 @@ 
TEST(SM50_device_minimum_multiplies_dsrgemm_nn_n, 32x32x8_8x16x1_2x2_4x8_4x2) { using WarpShape = cutlass::gemm::GemmShape<8, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1046,9 +1046,9 @@ TEST(SM50_device_minimum_multiplies_dsrgemm_nn_n, 64x32x8_16x16x1_4x2_4x8_4x2) { using WarpShape = cutlass::gemm::GemmShape<16, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1082,9 +1082,9 @@ TEST(SM50_device_minimum_multiplies_dsrgemm_nn_n, 64x64x8_16x32x1_4x4_4x8_4x2) { using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1118,9 +1118,9 @@ 
TEST(SM50_device_minimum_multiplies_dsrgemm_nn_n, 128x32x8_32x16x1_4x4_8x4_4x2) using WarpShape = cutlass::gemm::GemmShape<32, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1154,9 +1154,9 @@ TEST(SM50_device_minimum_multiplies_dsrgemm_nn_n, 32x64x16_8x16x1_2x2_4x8_4x4) { using WarpShape = cutlass::gemm::GemmShape<8, 16, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1190,9 +1190,9 @@ TEST(SM50_device_minimum_multiplies_dsrgemm_nn_n, 32x128x16_8x32x1_2x4_4x8_4x4) using WarpShape = cutlass::gemm::GemmShape<8, 32, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1226,9 +1226,9 @@ 
TEST(SM50_device_minimum_multiplies_dsrgemm_nn_n, 64x32x16_16x8x1_2x2_8x4_4x4) { using WarpShape = cutlass::gemm::GemmShape<16, 8, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1262,9 +1262,9 @@ TEST(SM50_device_minimum_multiplies_dsrgemm_nn_n, 64x64x8_16x16x1_4x2_4x8_4x4) { using WarpShape = cutlass::gemm::GemmShape<16, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1298,9 +1298,9 @@ TEST(SM50_device_minimum_multiplies_dsrgemm_nn_n, 128x32x16_32x8x1_4x2_8x4_4x4) using WarpShape = cutlass::gemm::GemmShape<32, 8, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; diff --git 
a/test/device/sm50_simt_minimum_multiplies_dsrgemm_nn_t.cu b/test/device/sm50_simt_minimum_multiplies_dsrgemm_nn_t.cu index 3645cc8..9bb122f 100644 --- a/test/device/sm50_simt_minimum_multiplies_dsrgemm_nn_t.cu +++ b/test/device/sm50_simt_minimum_multiplies_dsrgemm_nn_t.cu @@ -38,9 +38,9 @@ TEST(SM50_device_minimum_multiplies_dsrgemm_nn_t, 8x32x8_8x32x1_2x4_4x8_1x1) { using WarpShape = cutlass::gemm::GemmShape<8, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -74,9 +74,9 @@ TEST(SM50_device_minimum_multiplies_dsrgemm_nn_t, 16x32x8_16x32x1_4x4_4x8_1x1) { using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -110,9 +110,9 @@ TEST(SM50_device_minimum_multiplies_dsrgemm_nn_t, 16x64x8_16x64x1_4x8_4x8_1x1) { using WarpShape = cutlass::gemm::GemmShape<16, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename 
cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -146,9 +146,9 @@ TEST(SM50_device_minimum_multiplies_dsrgemm_nn_t, 32x32x8_32x32x1_8x4_4x8_1x1) { using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -182,9 +182,9 @@ TEST(SM50_device_minimum_multiplies_dsrgemm_nn_t, 8x32x8_8x16x1_2x2_4x8_1x2) { using WarpShape = cutlass::gemm::GemmShape<8, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -218,9 +218,9 @@ TEST(SM50_device_minimum_multiplies_dsrgemm_nn_t, 8x64x8_8x32x1_2x4_4x8_1x2) { using WarpShape = cutlass::gemm::GemmShape<8, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename 
cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -254,9 +254,9 @@ TEST(SM50_device_minimum_multiplies_dsrgemm_nn_t, 16x32x8_16x16x1_4x2_4x8_1x2) { using WarpShape = cutlass::gemm::GemmShape<16, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -290,9 +290,9 @@ TEST(SM50_device_minimum_multiplies_dsrgemm_nn_t, 16x64x8_16x32x1_4x4_4x8_1x2) { using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -326,9 +326,9 @@ TEST(SM50_device_minimum_multiplies_dsrgemm_nn_t, 16x128x8_16x64x1_4x8_4x8_1x2) using WarpShape = cutlass::gemm::GemmShape<16, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename 
cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -362,9 +362,9 @@ TEST(SM50_device_minimum_multiplies_dsrgemm_nn_t, 32x32x8_32x16x1_4x4_8x4_1x2) { using WarpShape = cutlass::gemm::GemmShape<32, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -398,9 +398,9 @@ TEST(SM50_device_minimum_multiplies_dsrgemm_nn_t, 32x64x8_32x32x1_8x4_4x8_1x2) { using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -434,9 +434,9 @@ TEST(SM50_device_minimum_multiplies_dsrgemm_nn_t, 32x32x8_16x32x1_4x4_4x8_2x1) { using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename 
cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -470,9 +470,9 @@ TEST(SM50_device_minimum_multiplies_dsrgemm_nn_t, 64x32x8_32x32x1_8x4_4x8_2x1) { using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -506,9 +506,9 @@ TEST(SM50_device_minimum_multiplies_dsrgemm_nn_t, 16x32x8_8x16x1_2x2_4x8_2x2) { using WarpShape = cutlass::gemm::GemmShape<8, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -542,9 +542,9 @@ TEST(SM50_device_minimum_multiplies_dsrgemm_nn_t, 16x64x8_8x32x1_2x4_4x8_2x2) { using WarpShape = cutlass::gemm::GemmShape<8, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename 
cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -578,9 +578,9 @@ TEST(SM50_device_minimum_multiplies_dsrgemm_nn_t, 32x32x8_16x16x1_4x2_4x8_2x2) { using WarpShape = cutlass::gemm::GemmShape<16, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -614,9 +614,9 @@ TEST(SM50_device_minimum_multiplies_dsrgemm_nn_t, 32x64x8_16x32x1_4x4_4x8_2x2) { using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -650,9 +650,9 @@ TEST(SM50_device_minimum_multiplies_dsrgemm_nn_t, 32x128x8_16x64x1_4x8_4x8_2x2) using WarpShape = cutlass::gemm::GemmShape<16, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename 
cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -686,9 +686,9 @@ TEST(SM50_device_minimum_multiplies_dsrgemm_nn_t, 64x32x8_32x16x1_4x4_8x4_2x2) { using WarpShape = cutlass::gemm::GemmShape<32, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -722,9 +722,9 @@ TEST(SM50_device_minimum_multiplies_dsrgemm_nn_t, 64x64x8_32x32x1_8x4_4x8_2x2) { using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -758,9 +758,9 @@ TEST(SM50_device_minimum_multiplies_dsrgemm_nn_t, 128x32x8_64x16x1_8x4_8x4_2x2) using WarpShape = cutlass::gemm::GemmShape<64, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename 
cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -794,9 +794,9 @@ TEST(SM50_device_minimum_multiplies_dsrgemm_nn_t, 16x64x16_8x16x1_2x2_4x8_2x4) { using WarpShape = cutlass::gemm::GemmShape<8, 16, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -830,9 +830,9 @@ TEST(SM50_device_minimum_multiplies_dsrgemm_nn_t, 16x128x16_8x32x1_2x4_4x8_2x4) using WarpShape = cutlass::gemm::GemmShape<8, 32, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -866,9 +866,9 @@ TEST(SM50_device_minimum_multiplies_dsrgemm_nn_t, 32x32x8_16x8x1_2x2_8x4_2x4) { using WarpShape = cutlass::gemm::GemmShape<16, 8, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename 
cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -902,9 +902,9 @@ TEST(SM50_device_minimum_multiplies_dsrgemm_nn_t, 32x64x8_16x16x1_4x2_4x8_2x4) { using WarpShape = cutlass::gemm::GemmShape<16, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -938,9 +938,9 @@ TEST(SM50_device_minimum_multiplies_dsrgemm_nn_t, 32x128x8_16x32x1_4x4_4x8_2x4) using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -974,9 +974,9 @@ TEST(SM50_device_minimum_multiplies_dsrgemm_nn_t, 64x64x8_32x16x1_4x4_8x4_2x4) { using WarpShape = cutlass::gemm::GemmShape<32, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename 
cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1010,9 +1010,9 @@ TEST(SM50_device_minimum_multiplies_dsrgemm_nn_t, 32x32x8_8x16x1_2x2_4x8_4x2) { using WarpShape = cutlass::gemm::GemmShape<8, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1046,9 +1046,9 @@ TEST(SM50_device_minimum_multiplies_dsrgemm_nn_t, 64x32x8_16x16x1_4x2_4x8_4x2) { using WarpShape = cutlass::gemm::GemmShape<16, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1082,9 +1082,9 @@ TEST(SM50_device_minimum_multiplies_dsrgemm_nn_t, 64x64x8_16x32x1_4x4_4x8_4x2) { using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename 
cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1118,9 +1118,9 @@ TEST(SM50_device_minimum_multiplies_dsrgemm_nn_t, 128x32x8_32x16x1_4x4_8x4_4x2) using WarpShape = cutlass::gemm::GemmShape<32, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1154,9 +1154,9 @@ TEST(SM50_device_minimum_multiplies_dsrgemm_nn_t, 32x64x16_8x16x1_2x2_4x8_4x4) { using WarpShape = cutlass::gemm::GemmShape<8, 16, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1190,9 +1190,9 @@ TEST(SM50_device_minimum_multiplies_dsrgemm_nn_t, 32x128x16_8x32x1_2x4_4x8_4x4) using WarpShape = cutlass::gemm::GemmShape<8, 32, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename 
cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1226,9 +1226,9 @@ TEST(SM50_device_minimum_multiplies_dsrgemm_nn_t, 64x32x16_16x8x1_2x2_8x4_4x4) { using WarpShape = cutlass::gemm::GemmShape<16, 8, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1262,9 +1262,9 @@ TEST(SM50_device_minimum_multiplies_dsrgemm_nn_t, 64x64x8_16x16x1_4x2_4x8_4x4) { using WarpShape = cutlass::gemm::GemmShape<16, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1298,9 +1298,9 @@ TEST(SM50_device_minimum_multiplies_dsrgemm_nn_t, 128x32x16_32x8x1_4x2_8x4_4x4) using WarpShape = cutlass::gemm::GemmShape<32, 8, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename 
cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; diff --git a/test/device/sm50_simt_minimum_multiplies_dsrgemm_nt_n.cu b/test/device/sm50_simt_minimum_multiplies_dsrgemm_nt_n.cu index 56ca8b7..273bc30 100644 --- a/test/device/sm50_simt_minimum_multiplies_dsrgemm_nt_n.cu +++ b/test/device/sm50_simt_minimum_multiplies_dsrgemm_nt_n.cu @@ -38,9 +38,9 @@ TEST(SM50_device_minimum_multiplies_dsrgemm_nt_n, 8x32x8_8x32x1_2x4_4x8_1x1) { using WarpShape = cutlass::gemm::GemmShape<8, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -74,9 +74,9 @@ TEST(SM50_device_minimum_multiplies_dsrgemm_nt_n, 16x32x8_16x32x1_4x4_4x8_1x1) { using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -110,9 +110,9 @@ TEST(SM50_device_minimum_multiplies_dsrgemm_nt_n, 16x64x8_16x64x1_4x8_4x8_1x1) { using WarpShape = cutlass::gemm::GemmShape<16, 64, 8>; using InstructionShape = 
cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -146,9 +146,9 @@ TEST(SM50_device_minimum_multiplies_dsrgemm_nt_n, 32x32x8_32x32x1_8x4_4x8_1x1) { using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -182,9 +182,9 @@ TEST(SM50_device_minimum_multiplies_dsrgemm_nt_n, 8x32x8_8x16x1_2x2_4x8_1x2) { using WarpShape = cutlass::gemm::GemmShape<8, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -218,9 +218,9 @@ TEST(SM50_device_minimum_multiplies_dsrgemm_nt_n, 8x64x8_8x32x1_2x4_4x8_1x2) { using WarpShape = cutlass::gemm::GemmShape<8, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using 
Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -254,9 +254,9 @@ TEST(SM50_device_minimum_multiplies_dsrgemm_nt_n, 16x32x8_16x16x1_4x2_4x8_1x2) { using WarpShape = cutlass::gemm::GemmShape<16, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -290,9 +290,9 @@ TEST(SM50_device_minimum_multiplies_dsrgemm_nt_n, 16x64x8_16x32x1_4x4_4x8_1x2) { using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -326,9 +326,9 @@ TEST(SM50_device_minimum_multiplies_dsrgemm_nt_n, 16x128x8_16x64x1_4x8_4x8_1x2) using WarpShape = cutlass::gemm::GemmShape<16, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename 
cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -362,9 +362,9 @@ TEST(SM50_device_minimum_multiplies_dsrgemm_nt_n, 32x32x8_32x16x1_4x4_8x4_1x2) { using WarpShape = cutlass::gemm::GemmShape<32, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -398,9 +398,9 @@ TEST(SM50_device_minimum_multiplies_dsrgemm_nt_n, 32x64x8_32x32x1_8x4_4x8_1x2) { using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -434,9 +434,9 @@ TEST(SM50_device_minimum_multiplies_dsrgemm_nt_n, 32x32x8_16x32x1_4x4_4x8_2x1) { using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename 
cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -470,9 +470,9 @@ TEST(SM50_device_minimum_multiplies_dsrgemm_nt_n, 64x32x8_32x32x1_8x4_4x8_2x1) { using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -506,9 +506,9 @@ TEST(SM50_device_minimum_multiplies_dsrgemm_nt_n, 16x32x8_8x16x1_2x2_4x8_2x2) { using WarpShape = cutlass::gemm::GemmShape<8, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -542,9 +542,9 @@ TEST(SM50_device_minimum_multiplies_dsrgemm_nt_n, 16x64x8_8x32x1_2x4_4x8_2x2) { using WarpShape = cutlass::gemm::GemmShape<8, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename 
cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -578,9 +578,9 @@ TEST(SM50_device_minimum_multiplies_dsrgemm_nt_n, 32x32x8_16x16x1_4x2_4x8_2x2) { using WarpShape = cutlass::gemm::GemmShape<16, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -614,9 +614,9 @@ TEST(SM50_device_minimum_multiplies_dsrgemm_nt_n, 32x64x8_16x32x1_4x4_4x8_2x2) { using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -650,9 +650,9 @@ TEST(SM50_device_minimum_multiplies_dsrgemm_nt_n, 32x128x8_16x64x1_4x8_4x8_2x2) using WarpShape = cutlass::gemm::GemmShape<16, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename 
cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -686,9 +686,9 @@ TEST(SM50_device_minimum_multiplies_dsrgemm_nt_n, 64x32x8_32x16x1_4x4_8x4_2x2) { using WarpShape = cutlass::gemm::GemmShape<32, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -722,9 +722,9 @@ TEST(SM50_device_minimum_multiplies_dsrgemm_nt_n, 64x64x8_32x32x1_8x4_4x8_2x2) { using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -758,9 +758,9 @@ TEST(SM50_device_minimum_multiplies_dsrgemm_nt_n, 128x32x8_64x16x1_8x4_8x4_2x2) using WarpShape = cutlass::gemm::GemmShape<64, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename 
cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -794,9 +794,9 @@ TEST(SM50_device_minimum_multiplies_dsrgemm_nt_n, 16x64x16_8x16x1_2x2_4x8_2x4) { using WarpShape = cutlass::gemm::GemmShape<8, 16, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -830,9 +830,9 @@ TEST(SM50_device_minimum_multiplies_dsrgemm_nt_n, 16x128x16_8x32x1_2x4_4x8_2x4) using WarpShape = cutlass::gemm::GemmShape<8, 32, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -866,9 +866,9 @@ TEST(SM50_device_minimum_multiplies_dsrgemm_nt_n, 32x32x8_16x8x1_2x2_8x4_2x4) { using WarpShape = cutlass::gemm::GemmShape<16, 8, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename 
cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -902,9 +902,9 @@ TEST(SM50_device_minimum_multiplies_dsrgemm_nt_n, 32x64x8_16x16x1_4x2_4x8_2x4) { using WarpShape = cutlass::gemm::GemmShape<16, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -938,9 +938,9 @@ TEST(SM50_device_minimum_multiplies_dsrgemm_nt_n, 32x128x8_16x32x1_4x4_4x8_2x4) using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -974,9 +974,9 @@ TEST(SM50_device_minimum_multiplies_dsrgemm_nt_n, 64x64x8_32x16x1_4x4_8x4_2x4) { using WarpShape = cutlass::gemm::GemmShape<32, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename 
cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1010,9 +1010,9 @@ TEST(SM50_device_minimum_multiplies_dsrgemm_nt_n, 32x32x8_8x16x1_2x2_4x8_4x2) { using WarpShape = cutlass::gemm::GemmShape<8, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1046,9 +1046,9 @@ TEST(SM50_device_minimum_multiplies_dsrgemm_nt_n, 64x32x8_16x16x1_4x2_4x8_4x2) { using WarpShape = cutlass::gemm::GemmShape<16, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1082,9 +1082,9 @@ TEST(SM50_device_minimum_multiplies_dsrgemm_nt_n, 64x64x8_16x32x1_4x4_4x8_4x2) { using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename 
cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1118,9 +1118,9 @@ TEST(SM50_device_minimum_multiplies_dsrgemm_nt_n, 128x32x8_32x16x1_4x4_8x4_4x2) using WarpShape = cutlass::gemm::GemmShape<32, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1154,9 +1154,9 @@ TEST(SM50_device_minimum_multiplies_dsrgemm_nt_n, 32x64x16_8x16x1_2x2_4x8_4x4) { using WarpShape = cutlass::gemm::GemmShape<8, 16, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1190,9 +1190,9 @@ TEST(SM50_device_minimum_multiplies_dsrgemm_nt_n, 32x128x16_8x32x1_2x4_4x8_4x4) using WarpShape = cutlass::gemm::GemmShape<8, 32, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename 
cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1226,9 +1226,9 @@ TEST(SM50_device_minimum_multiplies_dsrgemm_nt_n, 64x32x16_16x8x1_2x2_8x4_4x4) { using WarpShape = cutlass::gemm::GemmShape<16, 8, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1262,9 +1262,9 @@ TEST(SM50_device_minimum_multiplies_dsrgemm_nt_n, 64x64x8_16x16x1_4x2_4x8_4x4) { using WarpShape = cutlass::gemm::GemmShape<16, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1298,9 +1298,9 @@ TEST(SM50_device_minimum_multiplies_dsrgemm_nt_n, 128x32x16_32x8x1_4x2_8x4_4x4) using WarpShape = cutlass::gemm::GemmShape<32, 8, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename 
cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; diff --git a/test/device/sm50_simt_minimum_multiplies_dsrgemm_nt_t.cu b/test/device/sm50_simt_minimum_multiplies_dsrgemm_nt_t.cu index 496c439..c76ac16 100644 --- a/test/device/sm50_simt_minimum_multiplies_dsrgemm_nt_t.cu +++ b/test/device/sm50_simt_minimum_multiplies_dsrgemm_nt_t.cu @@ -38,9 +38,9 @@ TEST(SM50_device_minimum_multiplies_dsrgemm_nt_t, 8x32x8_8x32x1_2x4_4x8_1x1) { using WarpShape = cutlass::gemm::GemmShape<8, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -74,9 +74,9 @@ TEST(SM50_device_minimum_multiplies_dsrgemm_nt_t, 16x32x8_16x32x1_4x4_4x8_1x1) { using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ 
-110,9 +110,9 @@ TEST(SM50_device_minimum_multiplies_dsrgemm_nt_t, 16x64x8_16x64x1_4x8_4x8_1x1) { using WarpShape = cutlass::gemm::GemmShape<16, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -146,9 +146,9 @@ TEST(SM50_device_minimum_multiplies_dsrgemm_nt_t, 32x32x8_32x32x1_8x4_4x8_1x1) { using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -182,9 +182,9 @@ TEST(SM50_device_minimum_multiplies_dsrgemm_nt_t, 8x32x8_8x16x1_2x2_4x8_1x2) { using WarpShape = cutlass::gemm::GemmShape<8, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -218,9 +218,9 @@ 
TEST(SM50_device_minimum_multiplies_dsrgemm_nt_t, 8x64x8_8x32x1_2x4_4x8_1x2) { using WarpShape = cutlass::gemm::GemmShape<8, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -254,9 +254,9 @@ TEST(SM50_device_minimum_multiplies_dsrgemm_nt_t, 16x32x8_16x16x1_4x2_4x8_1x2) { using WarpShape = cutlass::gemm::GemmShape<16, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -290,9 +290,9 @@ TEST(SM50_device_minimum_multiplies_dsrgemm_nt_t, 16x64x8_16x32x1_4x4_4x8_1x2) { using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -326,9 +326,9 @@ 
TEST(SM50_device_minimum_multiplies_dsrgemm_nt_t, 16x128x8_16x64x1_4x8_4x8_1x2) using WarpShape = cutlass::gemm::GemmShape<16, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -362,9 +362,9 @@ TEST(SM50_device_minimum_multiplies_dsrgemm_nt_t, 32x32x8_32x16x1_4x4_8x4_1x2) { using WarpShape = cutlass::gemm::GemmShape<32, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -398,9 +398,9 @@ TEST(SM50_device_minimum_multiplies_dsrgemm_nt_t, 32x64x8_32x32x1_8x4_4x8_1x2) { using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -434,9 +434,9 @@ 
TEST(SM50_device_minimum_multiplies_dsrgemm_nt_t, 32x32x8_16x32x1_4x4_4x8_2x1) { using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -470,9 +470,9 @@ TEST(SM50_device_minimum_multiplies_dsrgemm_nt_t, 64x32x8_32x32x1_8x4_4x8_2x1) { using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -506,9 +506,9 @@ TEST(SM50_device_minimum_multiplies_dsrgemm_nt_t, 16x32x8_8x16x1_2x2_4x8_2x2) { using WarpShape = cutlass::gemm::GemmShape<8, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -542,9 +542,9 @@ 
TEST(SM50_device_minimum_multiplies_dsrgemm_nt_t, 16x64x8_8x32x1_2x4_4x8_2x2) { using WarpShape = cutlass::gemm::GemmShape<8, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -578,9 +578,9 @@ TEST(SM50_device_minimum_multiplies_dsrgemm_nt_t, 32x32x8_16x16x1_4x2_4x8_2x2) { using WarpShape = cutlass::gemm::GemmShape<16, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -614,9 +614,9 @@ TEST(SM50_device_minimum_multiplies_dsrgemm_nt_t, 32x64x8_16x32x1_4x4_4x8_2x2) { using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -650,9 +650,9 @@ 
TEST(SM50_device_minimum_multiplies_dsrgemm_nt_t, 32x128x8_16x64x1_4x8_4x8_2x2) using WarpShape = cutlass::gemm::GemmShape<16, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -686,9 +686,9 @@ TEST(SM50_device_minimum_multiplies_dsrgemm_nt_t, 64x32x8_32x16x1_4x4_8x4_2x2) { using WarpShape = cutlass::gemm::GemmShape<32, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -722,9 +722,9 @@ TEST(SM50_device_minimum_multiplies_dsrgemm_nt_t, 64x64x8_32x32x1_8x4_4x8_2x2) { using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -758,9 +758,9 @@ 
TEST(SM50_device_minimum_multiplies_dsrgemm_nt_t, 128x32x8_64x16x1_8x4_8x4_2x2) using WarpShape = cutlass::gemm::GemmShape<64, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -794,9 +794,9 @@ TEST(SM50_device_minimum_multiplies_dsrgemm_nt_t, 16x64x16_8x16x1_2x2_4x8_2x4) { using WarpShape = cutlass::gemm::GemmShape<8, 16, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -830,9 +830,9 @@ TEST(SM50_device_minimum_multiplies_dsrgemm_nt_t, 16x128x16_8x32x1_2x4_4x8_2x4) using WarpShape = cutlass::gemm::GemmShape<8, 32, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -866,9 +866,9 @@ 
TEST(SM50_device_minimum_multiplies_dsrgemm_nt_t, 32x32x8_16x8x1_2x2_8x4_2x4) { using WarpShape = cutlass::gemm::GemmShape<16, 8, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -902,9 +902,9 @@ TEST(SM50_device_minimum_multiplies_dsrgemm_nt_t, 32x64x8_16x16x1_4x2_4x8_2x4) { using WarpShape = cutlass::gemm::GemmShape<16, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -938,9 +938,9 @@ TEST(SM50_device_minimum_multiplies_dsrgemm_nt_t, 32x128x8_16x32x1_4x4_4x8_2x4) using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -974,9 +974,9 @@ 
TEST(SM50_device_minimum_multiplies_dsrgemm_nt_t, 64x64x8_32x16x1_4x4_8x4_2x4) { using WarpShape = cutlass::gemm::GemmShape<32, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1010,9 +1010,9 @@ TEST(SM50_device_minimum_multiplies_dsrgemm_nt_t, 32x32x8_8x16x1_2x2_4x8_4x2) { using WarpShape = cutlass::gemm::GemmShape<8, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1046,9 +1046,9 @@ TEST(SM50_device_minimum_multiplies_dsrgemm_nt_t, 64x32x8_16x16x1_4x2_4x8_4x2) { using WarpShape = cutlass::gemm::GemmShape<16, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1082,9 +1082,9 @@ 
TEST(SM50_device_minimum_multiplies_dsrgemm_nt_t, 64x64x8_16x32x1_4x4_4x8_4x2) { using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1118,9 +1118,9 @@ TEST(SM50_device_minimum_multiplies_dsrgemm_nt_t, 128x32x8_32x16x1_4x4_8x4_4x2) using WarpShape = cutlass::gemm::GemmShape<32, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1154,9 +1154,9 @@ TEST(SM50_device_minimum_multiplies_dsrgemm_nt_t, 32x64x16_8x16x1_2x2_4x8_4x4) { using WarpShape = cutlass::gemm::GemmShape<8, 16, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1190,9 +1190,9 @@ 
TEST(SM50_device_minimum_multiplies_dsrgemm_nt_t, 32x128x16_8x32x1_2x4_4x8_4x4) using WarpShape = cutlass::gemm::GemmShape<8, 32, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1226,9 +1226,9 @@ TEST(SM50_device_minimum_multiplies_dsrgemm_nt_t, 64x32x16_16x8x1_2x2_8x4_4x4) { using WarpShape = cutlass::gemm::GemmShape<16, 8, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1262,9 +1262,9 @@ TEST(SM50_device_minimum_multiplies_dsrgemm_nt_t, 64x64x8_16x16x1_4x2_4x8_4x4) { using WarpShape = cutlass::gemm::GemmShape<16, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1298,9 +1298,9 @@ 
TEST(SM50_device_minimum_multiplies_dsrgemm_nt_t, 128x32x16_32x8x1_4x2_8x4_4x4) using WarpShape = cutlass::gemm::GemmShape<32, 8, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; diff --git a/test/device/sm50_simt_minimum_multiplies_dsrgemm_tn_n.cu b/test/device/sm50_simt_minimum_multiplies_dsrgemm_tn_n.cu index e9bfe55..7995298 100644 --- a/test/device/sm50_simt_minimum_multiplies_dsrgemm_tn_n.cu +++ b/test/device/sm50_simt_minimum_multiplies_dsrgemm_tn_n.cu @@ -38,9 +38,9 @@ TEST(SM50_device_minimum_multiplies_dsrgemm_tn_n, 8x32x8_8x32x1_2x4_4x8_1x1) { using WarpShape = cutlass::gemm::GemmShape<8, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -74,9 +74,9 @@ TEST(SM50_device_minimum_multiplies_dsrgemm_tn_n, 16x32x8_16x32x1_4x4_4x8_1x1) { using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename 
cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -110,9 +110,9 @@ TEST(SM50_device_minimum_multiplies_dsrgemm_tn_n, 16x64x8_16x64x1_4x8_4x8_1x1) { using WarpShape = cutlass::gemm::GemmShape<16, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -146,9 +146,9 @@ TEST(SM50_device_minimum_multiplies_dsrgemm_tn_n, 32x32x8_32x32x1_8x4_4x8_1x1) { using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -182,9 +182,9 @@ TEST(SM50_device_minimum_multiplies_dsrgemm_tn_n, 8x32x8_8x16x1_2x2_4x8_1x2) { using WarpShape = cutlass::gemm::GemmShape<8, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename 
cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -218,9 +218,9 @@ TEST(SM50_device_minimum_multiplies_dsrgemm_tn_n, 8x64x8_8x32x1_2x4_4x8_1x2) { using WarpShape = cutlass::gemm::GemmShape<8, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -254,9 +254,9 @@ TEST(SM50_device_minimum_multiplies_dsrgemm_tn_n, 16x32x8_16x16x1_4x2_4x8_1x2) { using WarpShape = cutlass::gemm::GemmShape<16, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -290,9 +290,9 @@ TEST(SM50_device_minimum_multiplies_dsrgemm_tn_n, 16x64x8_16x32x1_4x4_4x8_1x2) { using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename 
cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -326,9 +326,9 @@ TEST(SM50_device_minimum_multiplies_dsrgemm_tn_n, 16x128x8_16x64x1_4x8_4x8_1x2) using WarpShape = cutlass::gemm::GemmShape<16, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -362,9 +362,9 @@ TEST(SM50_device_minimum_multiplies_dsrgemm_tn_n, 32x32x8_32x16x1_4x4_8x4_1x2) { using WarpShape = cutlass::gemm::GemmShape<32, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -398,9 +398,9 @@ TEST(SM50_device_minimum_multiplies_dsrgemm_tn_n, 32x64x8_32x32x1_8x4_4x8_1x2) { using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename 
cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -434,9 +434,9 @@ TEST(SM50_device_minimum_multiplies_dsrgemm_tn_n, 32x32x8_16x32x1_4x4_4x8_2x1) { using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -470,9 +470,9 @@ TEST(SM50_device_minimum_multiplies_dsrgemm_tn_n, 64x32x8_32x32x1_8x4_4x8_2x1) { using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -506,9 +506,9 @@ TEST(SM50_device_minimum_multiplies_dsrgemm_tn_n, 16x32x8_8x16x1_2x2_4x8_2x2) { using WarpShape = cutlass::gemm::GemmShape<8, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename 
cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -542,9 +542,9 @@ TEST(SM50_device_minimum_multiplies_dsrgemm_tn_n, 16x64x8_8x32x1_2x4_4x8_2x2) { using WarpShape = cutlass::gemm::GemmShape<8, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -578,9 +578,9 @@ TEST(SM50_device_minimum_multiplies_dsrgemm_tn_n, 32x32x8_16x16x1_4x2_4x8_2x2) { using WarpShape = cutlass::gemm::GemmShape<16, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -614,9 +614,9 @@ TEST(SM50_device_minimum_multiplies_dsrgemm_tn_n, 32x64x8_16x32x1_4x4_4x8_2x2) { using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename 
cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -650,9 +650,9 @@ TEST(SM50_device_minimum_multiplies_dsrgemm_tn_n, 32x128x8_16x64x1_4x8_4x8_2x2) using WarpShape = cutlass::gemm::GemmShape<16, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -686,9 +686,9 @@ TEST(SM50_device_minimum_multiplies_dsrgemm_tn_n, 64x32x8_32x16x1_4x4_8x4_2x2) { using WarpShape = cutlass::gemm::GemmShape<32, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -722,9 +722,9 @@ TEST(SM50_device_minimum_multiplies_dsrgemm_tn_n, 64x64x8_32x32x1_8x4_4x8_2x2) { using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename 
cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -758,9 +758,9 @@ TEST(SM50_device_minimum_multiplies_dsrgemm_tn_n, 128x32x8_64x16x1_8x4_8x4_2x2) using WarpShape = cutlass::gemm::GemmShape<64, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -794,9 +794,9 @@ TEST(SM50_device_minimum_multiplies_dsrgemm_tn_n, 16x64x16_8x16x1_2x2_4x8_2x4) { using WarpShape = cutlass::gemm::GemmShape<8, 16, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -830,9 +830,9 @@ TEST(SM50_device_minimum_multiplies_dsrgemm_tn_n, 16x128x16_8x32x1_2x4_4x8_2x4) using WarpShape = cutlass::gemm::GemmShape<8, 32, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename 
cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -866,9 +866,9 @@ TEST(SM50_device_minimum_multiplies_dsrgemm_tn_n, 32x32x8_16x8x1_2x2_8x4_2x4) { using WarpShape = cutlass::gemm::GemmShape<16, 8, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -902,9 +902,9 @@ TEST(SM50_device_minimum_multiplies_dsrgemm_tn_n, 32x64x8_16x16x1_4x2_4x8_2x4) { using WarpShape = cutlass::gemm::GemmShape<16, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -938,9 +938,9 @@ TEST(SM50_device_minimum_multiplies_dsrgemm_tn_n, 32x128x8_16x32x1_4x4_4x8_2x4) using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename 
cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -974,9 +974,9 @@ TEST(SM50_device_minimum_multiplies_dsrgemm_tn_n, 64x64x8_32x16x1_4x4_8x4_2x4) { using WarpShape = cutlass::gemm::GemmShape<32, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1010,9 +1010,9 @@ TEST(SM50_device_minimum_multiplies_dsrgemm_tn_n, 32x32x8_8x16x1_2x2_4x8_4x2) { using WarpShape = cutlass::gemm::GemmShape<8, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1046,9 +1046,9 @@ TEST(SM50_device_minimum_multiplies_dsrgemm_tn_n, 64x32x8_16x16x1_4x2_4x8_4x2) { using WarpShape = cutlass::gemm::GemmShape<16, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename 
cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1082,9 +1082,9 @@ TEST(SM50_device_minimum_multiplies_dsrgemm_tn_n, 64x64x8_16x32x1_4x4_4x8_4x2) { using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1118,9 +1118,9 @@ TEST(SM50_device_minimum_multiplies_dsrgemm_tn_n, 128x32x8_32x16x1_4x4_8x4_4x2) using WarpShape = cutlass::gemm::GemmShape<32, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1154,9 +1154,9 @@ TEST(SM50_device_minimum_multiplies_dsrgemm_tn_n, 32x64x16_8x16x1_2x2_4x8_4x4) { using WarpShape = cutlass::gemm::GemmShape<8, 16, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename 
cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1190,9 +1190,9 @@ TEST(SM50_device_minimum_multiplies_dsrgemm_tn_n, 32x128x16_8x32x1_2x4_4x8_4x4) using WarpShape = cutlass::gemm::GemmShape<8, 32, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1226,9 +1226,9 @@ TEST(SM50_device_minimum_multiplies_dsrgemm_tn_n, 64x32x16_16x8x1_2x2_8x4_4x4) { using WarpShape = cutlass::gemm::GemmShape<16, 8, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1262,9 +1262,9 @@ TEST(SM50_device_minimum_multiplies_dsrgemm_tn_n, 64x64x8_16x16x1_4x2_4x8_4x4) { using WarpShape = cutlass::gemm::GemmShape<16, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename 
cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1298,9 +1298,9 @@ TEST(SM50_device_minimum_multiplies_dsrgemm_tn_n, 128x32x16_32x8x1_4x2_8x4_4x4) using WarpShape = cutlass::gemm::GemmShape<32, 8, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; diff --git a/test/device/sm50_simt_minimum_multiplies_dsrgemm_tn_t.cu b/test/device/sm50_simt_minimum_multiplies_dsrgemm_tn_t.cu index 669b8cd..2193d15 100644 --- a/test/device/sm50_simt_minimum_multiplies_dsrgemm_tn_t.cu +++ b/test/device/sm50_simt_minimum_multiplies_dsrgemm_tn_t.cu @@ -38,9 +38,9 @@ TEST(SM50_device_minimum_multiplies_dsrgemm_tn_t, 8x32x8_8x32x1_2x4_4x8_1x1) { using WarpShape = cutlass::gemm::GemmShape<8, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -74,9 +74,9 @@ TEST(SM50_device_minimum_multiplies_dsrgemm_tn_t, 16x32x8_16x32x1_4x4_4x8_1x1) { using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = 
cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -110,9 +110,9 @@ TEST(SM50_device_minimum_multiplies_dsrgemm_tn_t, 16x64x8_16x64x1_4x8_4x8_1x1) { using WarpShape = cutlass::gemm::GemmShape<16, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -146,9 +146,9 @@ TEST(SM50_device_minimum_multiplies_dsrgemm_tn_t, 32x32x8_32x32x1_8x4_4x8_1x1) { using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -182,9 +182,9 @@ TEST(SM50_device_minimum_multiplies_dsrgemm_tn_t, 8x32x8_8x16x1_2x2_4x8_1x2) { using WarpShape = cutlass::gemm::GemmShape<8, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using 
Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -218,9 +218,9 @@ TEST(SM50_device_minimum_multiplies_dsrgemm_tn_t, 8x64x8_8x32x1_2x4_4x8_1x2) { using WarpShape = cutlass::gemm::GemmShape<8, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -254,9 +254,9 @@ TEST(SM50_device_minimum_multiplies_dsrgemm_tn_t, 16x32x8_16x16x1_4x2_4x8_1x2) { using WarpShape = cutlass::gemm::GemmShape<16, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -290,9 +290,9 @@ TEST(SM50_device_minimum_multiplies_dsrgemm_tn_t, 16x64x8_16x32x1_4x4_4x8_1x2) { using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename 
cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -326,9 +326,9 @@ TEST(SM50_device_minimum_multiplies_dsrgemm_tn_t, 16x128x8_16x64x1_4x8_4x8_1x2) using WarpShape = cutlass::gemm::GemmShape<16, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -362,9 +362,9 @@ TEST(SM50_device_minimum_multiplies_dsrgemm_tn_t, 32x32x8_32x16x1_4x4_8x4_1x2) { using WarpShape = cutlass::gemm::GemmShape<32, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -398,9 +398,9 @@ TEST(SM50_device_minimum_multiplies_dsrgemm_tn_t, 32x64x8_32x32x1_8x4_4x8_1x2) { using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename 
cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -434,9 +434,9 @@ TEST(SM50_device_minimum_multiplies_dsrgemm_tn_t, 32x32x8_16x32x1_4x4_4x8_2x1) { using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -470,9 +470,9 @@ TEST(SM50_device_minimum_multiplies_dsrgemm_tn_t, 64x32x8_32x32x1_8x4_4x8_2x1) { using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -506,9 +506,9 @@ TEST(SM50_device_minimum_multiplies_dsrgemm_tn_t, 16x32x8_8x16x1_2x2_4x8_2x2) { using WarpShape = cutlass::gemm::GemmShape<8, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename 
cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -542,9 +542,9 @@ TEST(SM50_device_minimum_multiplies_dsrgemm_tn_t, 16x64x8_8x32x1_2x4_4x8_2x2) { using WarpShape = cutlass::gemm::GemmShape<8, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -578,9 +578,9 @@ TEST(SM50_device_minimum_multiplies_dsrgemm_tn_t, 32x32x8_16x16x1_4x2_4x8_2x2) { using WarpShape = cutlass::gemm::GemmShape<16, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -614,9 +614,9 @@ TEST(SM50_device_minimum_multiplies_dsrgemm_tn_t, 32x64x8_16x32x1_4x4_4x8_2x2) { using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename 
cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -650,9 +650,9 @@ TEST(SM50_device_minimum_multiplies_dsrgemm_tn_t, 32x128x8_16x64x1_4x8_4x8_2x2) using WarpShape = cutlass::gemm::GemmShape<16, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -686,9 +686,9 @@ TEST(SM50_device_minimum_multiplies_dsrgemm_tn_t, 64x32x8_32x16x1_4x4_8x4_2x2) { using WarpShape = cutlass::gemm::GemmShape<32, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -722,9 +722,9 @@ TEST(SM50_device_minimum_multiplies_dsrgemm_tn_t, 64x64x8_32x32x1_8x4_4x8_2x2) { using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename 
cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -758,9 +758,9 @@ TEST(SM50_device_minimum_multiplies_dsrgemm_tn_t, 128x32x8_64x16x1_8x4_8x4_2x2) using WarpShape = cutlass::gemm::GemmShape<64, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -794,9 +794,9 @@ TEST(SM50_device_minimum_multiplies_dsrgemm_tn_t, 16x64x16_8x16x1_2x2_4x8_2x4) { using WarpShape = cutlass::gemm::GemmShape<8, 16, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -830,9 +830,9 @@ TEST(SM50_device_minimum_multiplies_dsrgemm_tn_t, 16x128x16_8x32x1_2x4_4x8_2x4) using WarpShape = cutlass::gemm::GemmShape<8, 32, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename 
cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -866,9 +866,9 @@ TEST(SM50_device_minimum_multiplies_dsrgemm_tn_t, 32x32x8_16x8x1_2x2_8x4_2x4) { using WarpShape = cutlass::gemm::GemmShape<16, 8, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -902,9 +902,9 @@ TEST(SM50_device_minimum_multiplies_dsrgemm_tn_t, 32x64x8_16x16x1_4x2_4x8_2x4) { using WarpShape = cutlass::gemm::GemmShape<16, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -938,9 +938,9 @@ TEST(SM50_device_minimum_multiplies_dsrgemm_tn_t, 32x128x8_16x32x1_4x4_4x8_2x4) using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename 
cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -974,9 +974,9 @@ TEST(SM50_device_minimum_multiplies_dsrgemm_tn_t, 64x64x8_32x16x1_4x4_8x4_2x4) { using WarpShape = cutlass::gemm::GemmShape<32, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1010,9 +1010,9 @@ TEST(SM50_device_minimum_multiplies_dsrgemm_tn_t, 32x32x8_8x16x1_2x2_4x8_4x2) { using WarpShape = cutlass::gemm::GemmShape<8, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1046,9 +1046,9 @@ TEST(SM50_device_minimum_multiplies_dsrgemm_tn_t, 64x32x8_16x16x1_4x2_4x8_4x2) { using WarpShape = cutlass::gemm::GemmShape<16, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename 
cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1082,9 +1082,9 @@ TEST(SM50_device_minimum_multiplies_dsrgemm_tn_t, 64x64x8_16x32x1_4x4_4x8_4x2) { using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1118,9 +1118,9 @@ TEST(SM50_device_minimum_multiplies_dsrgemm_tn_t, 128x32x8_32x16x1_4x4_8x4_4x2) using WarpShape = cutlass::gemm::GemmShape<32, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1154,9 +1154,9 @@ TEST(SM50_device_minimum_multiplies_dsrgemm_tn_t, 32x64x16_8x16x1_2x2_4x8_4x4) { using WarpShape = cutlass::gemm::GemmShape<8, 16, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename 
cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1190,9 +1190,9 @@ TEST(SM50_device_minimum_multiplies_dsrgemm_tn_t, 32x128x16_8x32x1_2x4_4x8_4x4) using WarpShape = cutlass::gemm::GemmShape<8, 32, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1226,9 +1226,9 @@ TEST(SM50_device_minimum_multiplies_dsrgemm_tn_t, 64x32x16_16x8x1_2x2_8x4_4x4) { using WarpShape = cutlass::gemm::GemmShape<16, 8, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1262,9 +1262,9 @@ TEST(SM50_device_minimum_multiplies_dsrgemm_tn_t, 64x64x8_16x16x1_4x2_4x8_4x4) { using WarpShape = cutlass::gemm::GemmShape<16, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename 
cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1298,9 +1298,9 @@ TEST(SM50_device_minimum_multiplies_dsrgemm_tn_t, 128x32x16_32x8x1_4x2_8x4_4x4) using WarpShape = cutlass::gemm::GemmShape<32, 8, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; diff --git a/test/device/sm50_simt_minimum_multiplies_dsrgemm_tt_n.cu b/test/device/sm50_simt_minimum_multiplies_dsrgemm_tt_n.cu index 29fd0e7..661e6dc 100644 --- a/test/device/sm50_simt_minimum_multiplies_dsrgemm_tt_n.cu +++ b/test/device/sm50_simt_minimum_multiplies_dsrgemm_tt_n.cu @@ -38,9 +38,9 @@ TEST(SM50_device_minimum_multiplies_dsrgemm_tt_n, 8x32x8_8x32x1_2x4_4x8_1x1) { using WarpShape = cutlass::gemm::GemmShape<8, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; 
@@ -74,9 +74,9 @@ TEST(SM50_device_minimum_multiplies_dsrgemm_tt_n, 16x32x8_16x32x1_4x4_4x8_1x1) { using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -110,9 +110,9 @@ TEST(SM50_device_minimum_multiplies_dsrgemm_tt_n, 16x64x8_16x64x1_4x8_4x8_1x1) { using WarpShape = cutlass::gemm::GemmShape<16, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -146,9 +146,9 @@ TEST(SM50_device_minimum_multiplies_dsrgemm_tt_n, 32x32x8_32x32x1_8x4_4x8_1x1) { using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -182,9 +182,9 @@ 
TEST(SM50_device_minimum_multiplies_dsrgemm_tt_n, 8x32x8_8x16x1_2x2_4x8_1x2) { using WarpShape = cutlass::gemm::GemmShape<8, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -218,9 +218,9 @@ TEST(SM50_device_minimum_multiplies_dsrgemm_tt_n, 8x64x8_8x32x1_2x4_4x8_1x2) { using WarpShape = cutlass::gemm::GemmShape<8, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -254,9 +254,9 @@ TEST(SM50_device_minimum_multiplies_dsrgemm_tt_n, 16x32x8_16x16x1_4x2_4x8_1x2) { using WarpShape = cutlass::gemm::GemmShape<16, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -290,9 +290,9 @@ 
TEST(SM50_device_minimum_multiplies_dsrgemm_tt_n, 16x64x8_16x32x1_4x4_4x8_1x2) { using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -326,9 +326,9 @@ TEST(SM50_device_minimum_multiplies_dsrgemm_tt_n, 16x128x8_16x64x1_4x8_4x8_1x2) using WarpShape = cutlass::gemm::GemmShape<16, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -362,9 +362,9 @@ TEST(SM50_device_minimum_multiplies_dsrgemm_tt_n, 32x32x8_32x16x1_4x4_8x4_1x2) { using WarpShape = cutlass::gemm::GemmShape<32, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -398,9 +398,9 @@ 
TEST(SM50_device_minimum_multiplies_dsrgemm_tt_n, 32x64x8_32x32x1_8x4_4x8_1x2) { using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -434,9 +434,9 @@ TEST(SM50_device_minimum_multiplies_dsrgemm_tt_n, 32x32x8_16x32x1_4x4_4x8_2x1) { using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -470,9 +470,9 @@ TEST(SM50_device_minimum_multiplies_dsrgemm_tt_n, 64x32x8_32x32x1_8x4_4x8_2x1) { using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -506,9 +506,9 @@ 
TEST(SM50_device_minimum_multiplies_dsrgemm_tt_n, 16x32x8_8x16x1_2x2_4x8_2x2) { using WarpShape = cutlass::gemm::GemmShape<8, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -542,9 +542,9 @@ TEST(SM50_device_minimum_multiplies_dsrgemm_tt_n, 16x64x8_8x32x1_2x4_4x8_2x2) { using WarpShape = cutlass::gemm::GemmShape<8, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -578,9 +578,9 @@ TEST(SM50_device_minimum_multiplies_dsrgemm_tt_n, 32x32x8_16x16x1_4x2_4x8_2x2) { using WarpShape = cutlass::gemm::GemmShape<16, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -614,9 +614,9 @@ 
TEST(SM50_device_minimum_multiplies_dsrgemm_tt_n, 32x64x8_16x32x1_4x4_4x8_2x2) { using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -650,9 +650,9 @@ TEST(SM50_device_minimum_multiplies_dsrgemm_tt_n, 32x128x8_16x64x1_4x8_4x8_2x2) using WarpShape = cutlass::gemm::GemmShape<16, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -686,9 +686,9 @@ TEST(SM50_device_minimum_multiplies_dsrgemm_tt_n, 64x32x8_32x16x1_4x4_8x4_2x2) { using WarpShape = cutlass::gemm::GemmShape<32, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -722,9 +722,9 @@ 
TEST(SM50_device_minimum_multiplies_dsrgemm_tt_n, 64x64x8_32x32x1_8x4_4x8_2x2) { using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -758,9 +758,9 @@ TEST(SM50_device_minimum_multiplies_dsrgemm_tt_n, 128x32x8_64x16x1_8x4_8x4_2x2) using WarpShape = cutlass::gemm::GemmShape<64, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -794,9 +794,9 @@ TEST(SM50_device_minimum_multiplies_dsrgemm_tt_n, 16x64x16_8x16x1_2x2_4x8_2x4) { using WarpShape = cutlass::gemm::GemmShape<8, 16, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -830,9 +830,9 @@ 
TEST(SM50_device_minimum_multiplies_dsrgemm_tt_n, 16x128x16_8x32x1_2x4_4x8_2x4) using WarpShape = cutlass::gemm::GemmShape<8, 32, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -866,9 +866,9 @@ TEST(SM50_device_minimum_multiplies_dsrgemm_tt_n, 32x32x8_16x8x1_2x2_8x4_2x4) { using WarpShape = cutlass::gemm::GemmShape<16, 8, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -902,9 +902,9 @@ TEST(SM50_device_minimum_multiplies_dsrgemm_tt_n, 32x64x8_16x16x1_4x2_4x8_2x4) { using WarpShape = cutlass::gemm::GemmShape<16, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -938,9 +938,9 @@ 
TEST(SM50_device_minimum_multiplies_dsrgemm_tt_n, 32x128x8_16x32x1_4x4_4x8_2x4) using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -974,9 +974,9 @@ TEST(SM50_device_minimum_multiplies_dsrgemm_tt_n, 64x64x8_32x16x1_4x4_8x4_2x4) { using WarpShape = cutlass::gemm::GemmShape<32, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1010,9 +1010,9 @@ TEST(SM50_device_minimum_multiplies_dsrgemm_tt_n, 32x32x8_8x16x1_2x2_4x8_4x2) { using WarpShape = cutlass::gemm::GemmShape<8, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1046,9 +1046,9 @@ 
TEST(SM50_device_minimum_multiplies_dsrgemm_tt_n, 64x32x8_16x16x1_4x2_4x8_4x2) { using WarpShape = cutlass::gemm::GemmShape<16, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1082,9 +1082,9 @@ TEST(SM50_device_minimum_multiplies_dsrgemm_tt_n, 64x64x8_16x32x1_4x4_4x8_4x2) { using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1118,9 +1118,9 @@ TEST(SM50_device_minimum_multiplies_dsrgemm_tt_n, 128x32x8_32x16x1_4x4_8x4_4x2) using WarpShape = cutlass::gemm::GemmShape<32, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1154,9 +1154,9 @@ 
TEST(SM50_device_minimum_multiplies_dsrgemm_tt_n, 32x64x16_8x16x1_2x2_4x8_4x4) { using WarpShape = cutlass::gemm::GemmShape<8, 16, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1190,9 +1190,9 @@ TEST(SM50_device_minimum_multiplies_dsrgemm_tt_n, 32x128x16_8x32x1_2x4_4x8_4x4) using WarpShape = cutlass::gemm::GemmShape<8, 32, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1226,9 +1226,9 @@ TEST(SM50_device_minimum_multiplies_dsrgemm_tt_n, 64x32x16_16x8x1_2x2_8x4_4x4) { using WarpShape = cutlass::gemm::GemmShape<16, 8, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1262,9 +1262,9 @@ 
TEST(SM50_device_minimum_multiplies_dsrgemm_tt_n, 64x64x8_16x16x1_4x2_4x8_4x4) { using WarpShape = cutlass::gemm::GemmShape<16, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1298,9 +1298,9 @@ TEST(SM50_device_minimum_multiplies_dsrgemm_tt_n, 128x32x16_32x8x1_4x2_8x4_4x4) using WarpShape = cutlass::gemm::GemmShape<32, 8, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; diff --git a/test/device/sm50_simt_minimum_multiplies_dsrgemm_tt_t.cu b/test/device/sm50_simt_minimum_multiplies_dsrgemm_tt_t.cu index 4cd90e9..2259d6d 100644 --- a/test/device/sm50_simt_minimum_multiplies_dsrgemm_tt_t.cu +++ b/test/device/sm50_simt_minimum_multiplies_dsrgemm_tt_t.cu @@ -38,9 +38,9 @@ TEST(SM50_device_minimum_multiplies_dsrgemm_tt_t, 8x32x8_8x32x1_2x4_4x8_1x1) { using WarpShape = cutlass::gemm::GemmShape<8, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename 
cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -74,9 +74,9 @@ TEST(SM50_device_minimum_multiplies_dsrgemm_tt_t, 16x32x8_16x32x1_4x4_4x8_1x1) { using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -110,9 +110,9 @@ TEST(SM50_device_minimum_multiplies_dsrgemm_tt_t, 16x64x8_16x64x1_4x8_4x8_1x1) { using WarpShape = cutlass::gemm::GemmShape<16, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -146,9 +146,9 @@ TEST(SM50_device_minimum_multiplies_dsrgemm_tt_t, 32x32x8_32x32x1_8x4_4x8_1x1) { using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename 
cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -182,9 +182,9 @@ TEST(SM50_device_minimum_multiplies_dsrgemm_tt_t, 8x32x8_8x16x1_2x2_4x8_1x2) { using WarpShape = cutlass::gemm::GemmShape<8, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -218,9 +218,9 @@ TEST(SM50_device_minimum_multiplies_dsrgemm_tt_t, 8x64x8_8x32x1_2x4_4x8_1x2) { using WarpShape = cutlass::gemm::GemmShape<8, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -254,9 +254,9 @@ TEST(SM50_device_minimum_multiplies_dsrgemm_tt_t, 16x32x8_16x16x1_4x2_4x8_1x2) { using WarpShape = cutlass::gemm::GemmShape<16, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename 
cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -290,9 +290,9 @@ TEST(SM50_device_minimum_multiplies_dsrgemm_tt_t, 16x64x8_16x32x1_4x4_4x8_1x2) { using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -326,9 +326,9 @@ TEST(SM50_device_minimum_multiplies_dsrgemm_tt_t, 16x128x8_16x64x1_4x8_4x8_1x2) using WarpShape = cutlass::gemm::GemmShape<16, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -362,9 +362,9 @@ TEST(SM50_device_minimum_multiplies_dsrgemm_tt_t, 32x32x8_32x16x1_4x4_8x4_1x2) { using WarpShape = cutlass::gemm::GemmShape<32, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename 
cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -398,9 +398,9 @@ TEST(SM50_device_minimum_multiplies_dsrgemm_tt_t, 32x64x8_32x32x1_8x4_4x8_1x2) { using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -434,9 +434,9 @@ TEST(SM50_device_minimum_multiplies_dsrgemm_tt_t, 32x32x8_16x32x1_4x4_4x8_2x1) { using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -470,9 +470,9 @@ TEST(SM50_device_minimum_multiplies_dsrgemm_tt_t, 64x32x8_32x32x1_8x4_4x8_2x1) { using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename 
cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -506,9 +506,9 @@ TEST(SM50_device_minimum_multiplies_dsrgemm_tt_t, 16x32x8_8x16x1_2x2_4x8_2x2) { using WarpShape = cutlass::gemm::GemmShape<8, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -542,9 +542,9 @@ TEST(SM50_device_minimum_multiplies_dsrgemm_tt_t, 16x64x8_8x32x1_2x4_4x8_2x2) { using WarpShape = cutlass::gemm::GemmShape<8, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -578,9 +578,9 @@ TEST(SM50_device_minimum_multiplies_dsrgemm_tt_t, 32x32x8_16x16x1_4x2_4x8_2x2) { using WarpShape = cutlass::gemm::GemmShape<16, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename 
cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -614,9 +614,9 @@ TEST(SM50_device_minimum_multiplies_dsrgemm_tt_t, 32x64x8_16x32x1_4x4_4x8_2x2) { using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -650,9 +650,9 @@ TEST(SM50_device_minimum_multiplies_dsrgemm_tt_t, 32x128x8_16x64x1_4x8_4x8_2x2) using WarpShape = cutlass::gemm::GemmShape<16, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -686,9 +686,9 @@ TEST(SM50_device_minimum_multiplies_dsrgemm_tt_t, 64x32x8_32x16x1_4x4_8x4_2x2) { using WarpShape = cutlass::gemm::GemmShape<32, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename 
cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -722,9 +722,9 @@ TEST(SM50_device_minimum_multiplies_dsrgemm_tt_t, 64x64x8_32x32x1_8x4_4x8_2x2) { using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -758,9 +758,9 @@ TEST(SM50_device_minimum_multiplies_dsrgemm_tt_t, 128x32x8_64x16x1_8x4_8x4_2x2) using WarpShape = cutlass::gemm::GemmShape<64, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -794,9 +794,9 @@ TEST(SM50_device_minimum_multiplies_dsrgemm_tt_t, 16x64x16_8x16x1_2x2_4x8_2x4) { using WarpShape = cutlass::gemm::GemmShape<8, 16, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename 
cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -830,9 +830,9 @@ TEST(SM50_device_minimum_multiplies_dsrgemm_tt_t, 16x128x16_8x32x1_2x4_4x8_2x4) using WarpShape = cutlass::gemm::GemmShape<8, 32, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -866,9 +866,9 @@ TEST(SM50_device_minimum_multiplies_dsrgemm_tt_t, 32x32x8_16x8x1_2x2_8x4_2x4) { using WarpShape = cutlass::gemm::GemmShape<16, 8, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -902,9 +902,9 @@ TEST(SM50_device_minimum_multiplies_dsrgemm_tt_t, 32x64x8_16x16x1_4x2_4x8_2x4) { using WarpShape = cutlass::gemm::GemmShape<16, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename 
cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -938,9 +938,9 @@ TEST(SM50_device_minimum_multiplies_dsrgemm_tt_t, 32x128x8_16x32x1_4x4_4x8_2x4) using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -974,9 +974,9 @@ TEST(SM50_device_minimum_multiplies_dsrgemm_tt_t, 64x64x8_32x16x1_4x4_8x4_2x4) { using WarpShape = cutlass::gemm::GemmShape<32, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1010,9 +1010,9 @@ TEST(SM50_device_minimum_multiplies_dsrgemm_tt_t, 32x32x8_8x16x1_2x2_4x8_4x2) { using WarpShape = cutlass::gemm::GemmShape<8, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename 
cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1046,9 +1046,9 @@ TEST(SM50_device_minimum_multiplies_dsrgemm_tt_t, 64x32x8_16x16x1_4x2_4x8_4x2) { using WarpShape = cutlass::gemm::GemmShape<16, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1082,9 +1082,9 @@ TEST(SM50_device_minimum_multiplies_dsrgemm_tt_t, 64x64x8_16x32x1_4x4_4x8_4x2) { using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1118,9 +1118,9 @@ TEST(SM50_device_minimum_multiplies_dsrgemm_tt_t, 128x32x8_32x16x1_4x4_8x4_4x2) using WarpShape = cutlass::gemm::GemmShape<32, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename 
cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1154,9 +1154,9 @@ TEST(SM50_device_minimum_multiplies_dsrgemm_tt_t, 32x64x16_8x16x1_2x2_4x8_4x4) { using WarpShape = cutlass::gemm::GemmShape<8, 16, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1190,9 +1190,9 @@ TEST(SM50_device_minimum_multiplies_dsrgemm_tt_t, 32x128x16_8x32x1_2x4_4x8_4x4) using WarpShape = cutlass::gemm::GemmShape<8, 32, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1226,9 +1226,9 @@ TEST(SM50_device_minimum_multiplies_dsrgemm_tt_t, 64x32x16_16x8x1_2x2_8x4_4x4) { using WarpShape = cutlass::gemm::GemmShape<16, 8, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename 
cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1262,9 +1262,9 @@ TEST(SM50_device_minimum_multiplies_dsrgemm_tt_t, 64x64x8_16x16x1_4x2_4x8_4x4) { using WarpShape = cutlass::gemm::GemmShape<16, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1298,9 +1298,9 @@ TEST(SM50_device_minimum_multiplies_dsrgemm_tt_t, 128x32x16_32x8x1_4x2_8x4_4x4) using WarpShape = cutlass::gemm::GemmShape<32, 8, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; diff --git a/test/device/sm50_simt_minimum_multiplies_ssrgemm_nn_n.cu b/test/device/sm50_simt_minimum_multiplies_ssrgemm_nn_n.cu index 48c4034..c4e5a02 100644 --- a/test/device/sm50_simt_minimum_multiplies_ssrgemm_nn_n.cu +++ b/test/device/sm50_simt_minimum_multiplies_ssrgemm_nn_n.cu @@ -38,9 +38,9 @@ TEST(SM50_device_minimum_multiplies_ssrgemm_nn_n, 8x32x8_8x32x1_2x4_4x8_1x1) { using WarpShape = cutlass::gemm::GemmShape<8, 32, 8>; using InstructionShape = 
cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -74,9 +74,9 @@ TEST(SM50_device_minimum_multiplies_ssrgemm_nn_n, 16x32x8_16x32x1_4x4_4x8_1x1) { using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -110,9 +110,9 @@ TEST(SM50_device_minimum_multiplies_ssrgemm_nn_n, 16x64x8_16x64x1_4x8_4x8_1x1) { using WarpShape = cutlass::gemm::GemmShape<16, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -146,9 +146,9 @@ TEST(SM50_device_minimum_multiplies_ssrgemm_nn_n, 32x32x8_32x32x1_8x4_4x8_1x1) { using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using 
Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -182,9 +182,9 @@ TEST(SM50_device_minimum_multiplies_ssrgemm_nn_n, 32x64x8_32x64x1_8x8_4x8_1x1) { using WarpShape = cutlass::gemm::GemmShape<32, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -218,9 +218,9 @@ TEST(SM50_device_minimum_multiplies_ssrgemm_nn_n, 64x32x8_64x32x1_8x8_8x4_1x1) { using WarpShape = cutlass::gemm::GemmShape<64, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -254,9 +254,9 @@ TEST(SM50_device_minimum_multiplies_ssrgemm_nn_n, 8x32x8_8x16x1_2x2_4x8_1x2) { using WarpShape = cutlass::gemm::GemmShape<8, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename 
cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -290,9 +290,9 @@ TEST(SM50_device_minimum_multiplies_ssrgemm_nn_n, 8x64x8_8x32x1_2x4_4x8_1x2) { using WarpShape = cutlass::gemm::GemmShape<8, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -326,9 +326,9 @@ TEST(SM50_device_minimum_multiplies_ssrgemm_nn_n, 16x32x8_16x16x1_4x2_4x8_1x2) { using WarpShape = cutlass::gemm::GemmShape<16, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -362,9 +362,9 @@ TEST(SM50_device_minimum_multiplies_ssrgemm_nn_n, 16x64x8_16x32x1_4x4_4x8_1x2) { using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename 
cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -398,9 +398,9 @@ TEST(SM50_device_minimum_multiplies_ssrgemm_nn_n, 16x128x8_16x64x1_4x8_4x8_1x2) using WarpShape = cutlass::gemm::GemmShape<16, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -434,9 +434,9 @@ TEST(SM50_device_minimum_multiplies_ssrgemm_nn_n, 32x32x8_32x16x1_4x4_8x4_1x2) { using WarpShape = cutlass::gemm::GemmShape<32, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -470,9 +470,9 @@ TEST(SM50_device_minimum_multiplies_ssrgemm_nn_n, 32x64x8_32x32x1_8x4_4x8_1x2) { using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename 
cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -506,9 +506,9 @@ TEST(SM50_device_minimum_multiplies_ssrgemm_nn_n, 32x128x8_32x64x1_8x8_4x8_1x2) using WarpShape = cutlass::gemm::GemmShape<32, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -542,9 +542,9 @@ TEST(SM50_device_minimum_multiplies_ssrgemm_nn_n, 64x64x8_64x32x1_8x8_8x4_1x2) { using WarpShape = cutlass::gemm::GemmShape<64, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -578,9 +578,9 @@ TEST(SM50_device_minimum_multiplies_ssrgemm_nn_n, 32x32x8_16x32x1_4x4_4x8_2x1) { using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename 
cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -614,9 +614,9 @@ TEST(SM50_device_minimum_multiplies_ssrgemm_nn_n, 64x32x8_32x32x1_8x4_4x8_2x1) { using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -650,9 +650,9 @@ TEST(SM50_device_minimum_multiplies_ssrgemm_nn_n, 64x64x8_32x64x1_8x8_4x8_2x1) { using WarpShape = cutlass::gemm::GemmShape<32, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -686,9 +686,9 @@ TEST(SM50_device_minimum_multiplies_ssrgemm_nn_n, 128x32x8_64x32x1_8x8_8x4_2x1) using WarpShape = cutlass::gemm::GemmShape<64, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename 
cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -722,9 +722,9 @@ TEST(SM50_device_minimum_multiplies_ssrgemm_nn_n, 16x32x8_8x16x1_2x2_4x8_2x2) { using WarpShape = cutlass::gemm::GemmShape<8, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -758,9 +758,9 @@ TEST(SM50_device_minimum_multiplies_ssrgemm_nn_n, 16x64x8_8x32x1_2x4_4x8_2x2) { using WarpShape = cutlass::gemm::GemmShape<8, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -794,9 +794,9 @@ TEST(SM50_device_minimum_multiplies_ssrgemm_nn_n, 32x32x8_16x16x1_4x2_4x8_2x2) { using WarpShape = cutlass::gemm::GemmShape<16, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename 
cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -830,9 +830,9 @@ TEST(SM50_device_minimum_multiplies_ssrgemm_nn_n, 32x64x8_16x32x1_4x4_4x8_2x2) { using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -866,9 +866,9 @@ TEST(SM50_device_minimum_multiplies_ssrgemm_nn_n, 32x128x8_16x64x1_4x8_4x8_2x2) using WarpShape = cutlass::gemm::GemmShape<16, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -902,9 +902,9 @@ TEST(SM50_device_minimum_multiplies_ssrgemm_nn_n, 64x32x8_32x16x1_4x4_8x4_2x2) { using WarpShape = cutlass::gemm::GemmShape<32, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename 
cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -938,9 +938,9 @@ TEST(SM50_device_minimum_multiplies_ssrgemm_nn_n, 64x64x8_32x32x1_8x4_4x8_2x2) { using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -974,9 +974,9 @@ TEST(SM50_device_minimum_multiplies_ssrgemm_nn_n, 64x128x8_32x64x1_8x8_4x8_2x2) using WarpShape = cutlass::gemm::GemmShape<32, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1010,9 +1010,9 @@ TEST(SM50_device_minimum_multiplies_ssrgemm_nn_n, 128x32x8_64x16x1_8x4_8x4_2x2) using WarpShape = cutlass::gemm::GemmShape<64, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename 
cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1046,9 +1046,9 @@ TEST(SM50_device_minimum_multiplies_ssrgemm_nn_n, 128x64x8_64x32x1_8x8_8x4_2x2) using WarpShape = cutlass::gemm::GemmShape<64, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1082,9 +1082,9 @@ TEST(SM50_device_minimum_multiplies_ssrgemm_nn_n, 16x64x16_8x16x1_2x2_4x8_2x4) { using WarpShape = cutlass::gemm::GemmShape<8, 16, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1118,9 +1118,9 @@ TEST(SM50_device_minimum_multiplies_ssrgemm_nn_n, 16x128x16_8x32x1_2x4_4x8_2x4) using WarpShape = cutlass::gemm::GemmShape<8, 32, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename 
cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1154,9 +1154,9 @@ TEST(SM50_device_minimum_multiplies_ssrgemm_nn_n, 32x32x8_16x8x1_2x2_8x4_2x4) { using WarpShape = cutlass::gemm::GemmShape<16, 8, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1190,9 +1190,9 @@ TEST(SM50_device_minimum_multiplies_ssrgemm_nn_n, 32x64x8_16x16x1_4x2_4x8_2x4) { using WarpShape = cutlass::gemm::GemmShape<16, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1226,9 +1226,9 @@ TEST(SM50_device_minimum_multiplies_ssrgemm_nn_n, 32x128x8_16x32x1_4x4_4x8_2x4) using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename 
cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1262,9 +1262,9 @@ TEST(SM50_device_minimum_multiplies_ssrgemm_nn_n, 32x256x8_16x64x1_4x8_4x8_2x4) using WarpShape = cutlass::gemm::GemmShape<16, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1298,9 +1298,9 @@ TEST(SM50_device_minimum_multiplies_ssrgemm_nn_n, 64x64x8_32x16x1_4x4_8x4_2x4) { using WarpShape = cutlass::gemm::GemmShape<32, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1334,9 +1334,9 @@ TEST(SM50_device_minimum_multiplies_ssrgemm_nn_n, 64x128x8_32x32x1_8x4_4x8_2x4) using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename 
cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1370,9 +1370,9 @@ TEST(SM50_device_minimum_multiplies_ssrgemm_nn_n, 64x256x8_32x64x1_8x8_4x8_2x4) using WarpShape = cutlass::gemm::GemmShape<32, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1406,9 +1406,9 @@ TEST(SM50_device_minimum_multiplies_ssrgemm_nn_n, 128x128x8_64x32x1_8x8_8x4_2x4) using WarpShape = cutlass::gemm::GemmShape<64, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1442,9 +1442,9 @@ TEST(SM50_device_minimum_multiplies_ssrgemm_nn_n, 32x32x8_8x16x1_2x2_4x8_4x2) { using WarpShape = cutlass::gemm::GemmShape<8, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename 
cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1478,9 +1478,9 @@ TEST(SM50_device_minimum_multiplies_ssrgemm_nn_n, 64x32x8_16x16x1_4x2_4x8_4x2) { using WarpShape = cutlass::gemm::GemmShape<16, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1514,9 +1514,9 @@ TEST(SM50_device_minimum_multiplies_ssrgemm_nn_n, 64x64x8_16x32x1_4x4_4x8_4x2) { using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1550,9 +1550,9 @@ TEST(SM50_device_minimum_multiplies_ssrgemm_nn_n, 128x32x8_32x16x1_4x4_8x4_4x2) using WarpShape = cutlass::gemm::GemmShape<32, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename 
cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1586,9 +1586,9 @@ TEST(SM50_device_minimum_multiplies_ssrgemm_nn_n, 128x64x8_32x32x1_8x4_4x8_4x2) using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1622,9 +1622,9 @@ TEST(SM50_device_minimum_multiplies_ssrgemm_nn_n, 128x128x8_32x64x1_8x8_4x8_4x2) using WarpShape = cutlass::gemm::GemmShape<32, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1658,9 +1658,9 @@ TEST(SM50_device_minimum_multiplies_ssrgemm_nn_n, 256x32x8_64x16x1_8x4_8x4_4x2) using WarpShape = cutlass::gemm::GemmShape<64, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename 
cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1694,9 +1694,9 @@ TEST(SM50_device_minimum_multiplies_ssrgemm_nn_n, 256x64x8_64x32x1_8x8_8x4_4x2) using WarpShape = cutlass::gemm::GemmShape<64, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1730,9 +1730,9 @@ TEST(SM50_device_minimum_multiplies_ssrgemm_nn_n, 32x64x16_8x16x1_2x2_4x8_4x4) { using WarpShape = cutlass::gemm::GemmShape<8, 16, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1766,9 +1766,9 @@ TEST(SM50_device_minimum_multiplies_ssrgemm_nn_n, 32x128x16_8x32x1_2x4_4x8_4x4) using WarpShape = cutlass::gemm::GemmShape<8, 32, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename 
cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1802,9 +1802,9 @@ TEST(SM50_device_minimum_multiplies_ssrgemm_nn_n, 64x32x16_16x8x1_2x2_8x4_4x4) { using WarpShape = cutlass::gemm::GemmShape<16, 8, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1838,9 +1838,9 @@ TEST(SM50_device_minimum_multiplies_ssrgemm_nn_n, 64x64x8_16x16x1_4x2_4x8_4x4) { using WarpShape = cutlass::gemm::GemmShape<16, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1874,9 +1874,9 @@ TEST(SM50_device_minimum_multiplies_ssrgemm_nn_n, 64x128x8_16x32x1_4x4_4x8_4x4) using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename 
cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1910,9 +1910,9 @@ TEST(SM50_device_minimum_multiplies_ssrgemm_nn_n, 64x256x8_16x64x1_4x8_4x8_4x4) using WarpShape = cutlass::gemm::GemmShape<16, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1946,9 +1946,9 @@ TEST(SM50_device_minimum_multiplies_ssrgemm_nn_n, 128x32x16_32x8x1_4x2_8x4_4x4) using WarpShape = cutlass::gemm::GemmShape<32, 8, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1982,9 +1982,9 @@ TEST(SM50_device_minimum_multiplies_ssrgemm_nn_n, 128x64x8_32x16x1_4x4_8x4_4x4) using WarpShape = cutlass::gemm::GemmShape<32, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename 
cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -2018,9 +2018,9 @@ TEST(SM50_device_minimum_multiplies_ssrgemm_nn_n, 128x128x8_32x32x1_8x4_4x8_4x4) using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -2054,9 +2054,9 @@ TEST(SM50_device_minimum_multiplies_ssrgemm_nn_n, 256x64x8_64x16x1_8x4_8x4_4x4) using WarpShape = cutlass::gemm::GemmShape<64, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; diff --git a/test/device/sm50_simt_minimum_multiplies_ssrgemm_nn_t.cu b/test/device/sm50_simt_minimum_multiplies_ssrgemm_nn_t.cu index 3f7a034..a33b767 100644 --- a/test/device/sm50_simt_minimum_multiplies_ssrgemm_nn_t.cu +++ 
b/test/device/sm50_simt_minimum_multiplies_ssrgemm_nn_t.cu @@ -38,9 +38,9 @@ TEST(SM50_device_minimum_multiplies_ssrgemm_nn_t, 8x32x8_8x32x1_2x4_4x8_1x1) { using WarpShape = cutlass::gemm::GemmShape<8, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -74,9 +74,9 @@ TEST(SM50_device_minimum_multiplies_ssrgemm_nn_t, 16x32x8_16x32x1_4x4_4x8_1x1) { using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -110,9 +110,9 @@ TEST(SM50_device_minimum_multiplies_ssrgemm_nn_t, 16x64x8_16x64x1_4x8_4x8_1x1) { using WarpShape = cutlass::gemm::GemmShape<16, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = 
Config::MultiplicationOp; @@ -146,9 +146,9 @@ TEST(SM50_device_minimum_multiplies_ssrgemm_nn_t, 32x32x8_32x32x1_8x4_4x8_1x1) { using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -182,9 +182,9 @@ TEST(SM50_device_minimum_multiplies_ssrgemm_nn_t, 32x64x8_32x64x1_8x8_4x8_1x1) { using WarpShape = cutlass::gemm::GemmShape<32, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -218,9 +218,9 @@ TEST(SM50_device_minimum_multiplies_ssrgemm_nn_t, 64x32x8_64x32x1_8x8_8x4_1x1) { using WarpShape = cutlass::gemm::GemmShape<64, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -254,9 
+254,9 @@ TEST(SM50_device_minimum_multiplies_ssrgemm_nn_t, 8x32x8_8x16x1_2x2_4x8_1x2) { using WarpShape = cutlass::gemm::GemmShape<8, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -290,9 +290,9 @@ TEST(SM50_device_minimum_multiplies_ssrgemm_nn_t, 8x64x8_8x32x1_2x4_4x8_1x2) { using WarpShape = cutlass::gemm::GemmShape<8, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -326,9 +326,9 @@ TEST(SM50_device_minimum_multiplies_ssrgemm_nn_t, 16x32x8_16x16x1_4x2_4x8_1x2) { using WarpShape = cutlass::gemm::GemmShape<16, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -362,9 +362,9 @@ 
TEST(SM50_device_minimum_multiplies_ssrgemm_nn_t, 16x64x8_16x32x1_4x4_4x8_1x2) { using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -398,9 +398,9 @@ TEST(SM50_device_minimum_multiplies_ssrgemm_nn_t, 16x128x8_16x64x1_4x8_4x8_1x2) using WarpShape = cutlass::gemm::GemmShape<16, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -434,9 +434,9 @@ TEST(SM50_device_minimum_multiplies_ssrgemm_nn_t, 32x32x8_32x16x1_4x4_8x4_1x2) { using WarpShape = cutlass::gemm::GemmShape<32, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -470,9 +470,9 @@ 
TEST(SM50_device_minimum_multiplies_ssrgemm_nn_t, 32x64x8_32x32x1_8x4_4x8_1x2) { using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -506,9 +506,9 @@ TEST(SM50_device_minimum_multiplies_ssrgemm_nn_t, 32x128x8_32x64x1_8x8_4x8_1x2) using WarpShape = cutlass::gemm::GemmShape<32, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -542,9 +542,9 @@ TEST(SM50_device_minimum_multiplies_ssrgemm_nn_t, 64x64x8_64x32x1_8x8_8x4_1x2) { using WarpShape = cutlass::gemm::GemmShape<64, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -578,9 +578,9 @@ 
TEST(SM50_device_minimum_multiplies_ssrgemm_nn_t, 32x32x8_16x32x1_4x4_4x8_2x1) { using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -614,9 +614,9 @@ TEST(SM50_device_minimum_multiplies_ssrgemm_nn_t, 64x32x8_32x32x1_8x4_4x8_2x1) { using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -650,9 +650,9 @@ TEST(SM50_device_minimum_multiplies_ssrgemm_nn_t, 64x64x8_32x64x1_8x8_4x8_2x1) { using WarpShape = cutlass::gemm::GemmShape<32, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -686,9 +686,9 @@ 
TEST(SM50_device_minimum_multiplies_ssrgemm_nn_t, 128x32x8_64x32x1_8x8_8x4_2x1) using WarpShape = cutlass::gemm::GemmShape<64, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -722,9 +722,9 @@ TEST(SM50_device_minimum_multiplies_ssrgemm_nn_t, 16x32x8_8x16x1_2x2_4x8_2x2) { using WarpShape = cutlass::gemm::GemmShape<8, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -758,9 +758,9 @@ TEST(SM50_device_minimum_multiplies_ssrgemm_nn_t, 16x64x8_8x32x1_2x4_4x8_2x2) { using WarpShape = cutlass::gemm::GemmShape<8, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -794,9 +794,9 @@ 
TEST(SM50_device_minimum_multiplies_ssrgemm_nn_t, 32x32x8_16x16x1_4x2_4x8_2x2) { using WarpShape = cutlass::gemm::GemmShape<16, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -830,9 +830,9 @@ TEST(SM50_device_minimum_multiplies_ssrgemm_nn_t, 32x64x8_16x32x1_4x4_4x8_2x2) { using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -866,9 +866,9 @@ TEST(SM50_device_minimum_multiplies_ssrgemm_nn_t, 32x128x8_16x64x1_4x8_4x8_2x2) using WarpShape = cutlass::gemm::GemmShape<16, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -902,9 +902,9 @@ 
TEST(SM50_device_minimum_multiplies_ssrgemm_nn_t, 64x32x8_32x16x1_4x4_8x4_2x2) { using WarpShape = cutlass::gemm::GemmShape<32, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -938,9 +938,9 @@ TEST(SM50_device_minimum_multiplies_ssrgemm_nn_t, 64x64x8_32x32x1_8x4_4x8_2x2) { using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -974,9 +974,9 @@ TEST(SM50_device_minimum_multiplies_ssrgemm_nn_t, 64x128x8_32x64x1_8x8_4x8_2x2) using WarpShape = cutlass::gemm::GemmShape<32, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1010,9 +1010,9 @@ 
TEST(SM50_device_minimum_multiplies_ssrgemm_nn_t, 128x32x8_64x16x1_8x4_8x4_2x2) using WarpShape = cutlass::gemm::GemmShape<64, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1046,9 +1046,9 @@ TEST(SM50_device_minimum_multiplies_ssrgemm_nn_t, 128x64x8_64x32x1_8x8_8x4_2x2) using WarpShape = cutlass::gemm::GemmShape<64, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1082,9 +1082,9 @@ TEST(SM50_device_minimum_multiplies_ssrgemm_nn_t, 16x64x16_8x16x1_2x2_4x8_2x4) { using WarpShape = cutlass::gemm::GemmShape<8, 16, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1118,9 +1118,9 @@ 
TEST(SM50_device_minimum_multiplies_ssrgemm_nn_t, 16x128x16_8x32x1_2x4_4x8_2x4) using WarpShape = cutlass::gemm::GemmShape<8, 32, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1154,9 +1154,9 @@ TEST(SM50_device_minimum_multiplies_ssrgemm_nn_t, 32x32x8_16x8x1_2x2_8x4_2x4) { using WarpShape = cutlass::gemm::GemmShape<16, 8, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1190,9 +1190,9 @@ TEST(SM50_device_minimum_multiplies_ssrgemm_nn_t, 32x64x8_16x16x1_4x2_4x8_2x4) { using WarpShape = cutlass::gemm::GemmShape<16, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1226,9 +1226,9 @@ 
TEST(SM50_device_minimum_multiplies_ssrgemm_nn_t, 32x128x8_16x32x1_4x4_4x8_2x4) using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1262,9 +1262,9 @@ TEST(SM50_device_minimum_multiplies_ssrgemm_nn_t, 32x256x8_16x64x1_4x8_4x8_2x4) using WarpShape = cutlass::gemm::GemmShape<16, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1298,9 +1298,9 @@ TEST(SM50_device_minimum_multiplies_ssrgemm_nn_t, 64x64x8_32x16x1_4x4_8x4_2x4) { using WarpShape = cutlass::gemm::GemmShape<32, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1334,9 +1334,9 @@ 
TEST(SM50_device_minimum_multiplies_ssrgemm_nn_t, 64x128x8_32x32x1_8x4_4x8_2x4) using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1370,9 +1370,9 @@ TEST(SM50_device_minimum_multiplies_ssrgemm_nn_t, 64x256x8_32x64x1_8x8_4x8_2x4) using WarpShape = cutlass::gemm::GemmShape<32, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1406,9 +1406,9 @@ TEST(SM50_device_minimum_multiplies_ssrgemm_nn_t, 128x128x8_64x32x1_8x8_8x4_2x4) using WarpShape = cutlass::gemm::GemmShape<64, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1442,9 +1442,9 @@ 
TEST(SM50_device_minimum_multiplies_ssrgemm_nn_t, 32x32x8_8x16x1_2x2_4x8_4x2) { using WarpShape = cutlass::gemm::GemmShape<8, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1478,9 +1478,9 @@ TEST(SM50_device_minimum_multiplies_ssrgemm_nn_t, 64x32x8_16x16x1_4x2_4x8_4x2) { using WarpShape = cutlass::gemm::GemmShape<16, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1514,9 +1514,9 @@ TEST(SM50_device_minimum_multiplies_ssrgemm_nn_t, 64x64x8_16x32x1_4x4_4x8_4x2) { using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1550,9 +1550,9 @@ 
TEST(SM50_device_minimum_multiplies_ssrgemm_nn_t, 128x32x8_32x16x1_4x4_8x4_4x2) using WarpShape = cutlass::gemm::GemmShape<32, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1586,9 +1586,9 @@ TEST(SM50_device_minimum_multiplies_ssrgemm_nn_t, 128x64x8_32x32x1_8x4_4x8_4x2) using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1622,9 +1622,9 @@ TEST(SM50_device_minimum_multiplies_ssrgemm_nn_t, 128x128x8_32x64x1_8x8_4x8_4x2) using WarpShape = cutlass::gemm::GemmShape<32, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1658,9 +1658,9 @@ 
TEST(SM50_device_minimum_multiplies_ssrgemm_nn_t, 256x32x8_64x16x1_8x4_8x4_4x2) using WarpShape = cutlass::gemm::GemmShape<64, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1694,9 +1694,9 @@ TEST(SM50_device_minimum_multiplies_ssrgemm_nn_t, 256x64x8_64x32x1_8x8_8x4_4x2) using WarpShape = cutlass::gemm::GemmShape<64, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1730,9 +1730,9 @@ TEST(SM50_device_minimum_multiplies_ssrgemm_nn_t, 32x64x16_8x16x1_2x2_4x8_4x4) { using WarpShape = cutlass::gemm::GemmShape<8, 16, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1766,9 +1766,9 @@ 
TEST(SM50_device_minimum_multiplies_ssrgemm_nn_t, 32x128x16_8x32x1_2x4_4x8_4x4) using WarpShape = cutlass::gemm::GemmShape<8, 32, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1802,9 +1802,9 @@ TEST(SM50_device_minimum_multiplies_ssrgemm_nn_t, 64x32x16_16x8x1_2x2_8x4_4x4) { using WarpShape = cutlass::gemm::GemmShape<16, 8, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1838,9 +1838,9 @@ TEST(SM50_device_minimum_multiplies_ssrgemm_nn_t, 64x64x8_16x16x1_4x2_4x8_4x4) { using WarpShape = cutlass::gemm::GemmShape<16, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1874,9 +1874,9 @@ 
TEST(SM50_device_minimum_multiplies_ssrgemm_nn_t, 64x128x8_16x32x1_4x4_4x8_4x4) using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1910,9 +1910,9 @@ TEST(SM50_device_minimum_multiplies_ssrgemm_nn_t, 64x256x8_16x64x1_4x8_4x8_4x4) using WarpShape = cutlass::gemm::GemmShape<16, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1946,9 +1946,9 @@ TEST(SM50_device_minimum_multiplies_ssrgemm_nn_t, 128x32x16_32x8x1_4x2_8x4_4x4) using WarpShape = cutlass::gemm::GemmShape<32, 8, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1982,9 +1982,9 @@ 
TEST(SM50_device_minimum_multiplies_ssrgemm_nn_t, 128x64x8_32x16x1_4x4_8x4_4x4) using WarpShape = cutlass::gemm::GemmShape<32, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -2018,9 +2018,9 @@ TEST(SM50_device_minimum_multiplies_ssrgemm_nn_t, 128x128x8_32x32x1_8x4_4x8_4x4) using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -2054,9 +2054,9 @@ TEST(SM50_device_minimum_multiplies_ssrgemm_nn_t, 256x64x8_64x16x1_8x4_8x4_4x4) using WarpShape = cutlass::gemm::GemmShape<64, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; diff --git 
a/test/device/sm50_simt_minimum_multiplies_ssrgemm_nt_n.cu b/test/device/sm50_simt_minimum_multiplies_ssrgemm_nt_n.cu index 776736d..8f540e4 100644 --- a/test/device/sm50_simt_minimum_multiplies_ssrgemm_nt_n.cu +++ b/test/device/sm50_simt_minimum_multiplies_ssrgemm_nt_n.cu @@ -38,9 +38,9 @@ TEST(SM50_device_minimum_multiplies_ssrgemm_nt_n, 8x32x8_8x32x1_2x4_4x8_1x1) { using WarpShape = cutlass::gemm::GemmShape<8, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -74,9 +74,9 @@ TEST(SM50_device_minimum_multiplies_ssrgemm_nt_n, 16x32x8_16x32x1_4x4_4x8_1x1) { using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -110,9 +110,9 @@ TEST(SM50_device_minimum_multiplies_ssrgemm_nt_n, 16x64x8_16x64x1_4x8_4x8_1x1) { using WarpShape = cutlass::gemm::GemmShape<16, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename 
cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -146,9 +146,9 @@ TEST(SM50_device_minimum_multiplies_ssrgemm_nt_n, 32x32x8_32x32x1_8x4_4x8_1x1) { using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -182,9 +182,9 @@ TEST(SM50_device_minimum_multiplies_ssrgemm_nt_n, 32x64x8_32x64x1_8x8_4x8_1x1) { using WarpShape = cutlass::gemm::GemmShape<32, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -218,9 +218,9 @@ TEST(SM50_device_minimum_multiplies_ssrgemm_nt_n, 64x32x8_64x32x1_8x8_8x4_1x1) { using WarpShape = cutlass::gemm::GemmShape<64, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename 
cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -254,9 +254,9 @@ TEST(SM50_device_minimum_multiplies_ssrgemm_nt_n, 8x32x8_8x16x1_2x2_4x8_1x2) { using WarpShape = cutlass::gemm::GemmShape<8, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -290,9 +290,9 @@ TEST(SM50_device_minimum_multiplies_ssrgemm_nt_n, 8x64x8_8x32x1_2x4_4x8_1x2) { using WarpShape = cutlass::gemm::GemmShape<8, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -326,9 +326,9 @@ TEST(SM50_device_minimum_multiplies_ssrgemm_nt_n, 16x32x8_16x16x1_4x2_4x8_1x2) { using WarpShape = cutlass::gemm::GemmShape<16, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename 
cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -362,9 +362,9 @@ TEST(SM50_device_minimum_multiplies_ssrgemm_nt_n, 16x64x8_16x32x1_4x4_4x8_1x2) { using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -398,9 +398,9 @@ TEST(SM50_device_minimum_multiplies_ssrgemm_nt_n, 16x128x8_16x64x1_4x8_4x8_1x2) using WarpShape = cutlass::gemm::GemmShape<16, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -434,9 +434,9 @@ TEST(SM50_device_minimum_multiplies_ssrgemm_nt_n, 32x32x8_32x16x1_4x4_8x4_1x2) { using WarpShape = cutlass::gemm::GemmShape<32, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename 
cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -470,9 +470,9 @@ TEST(SM50_device_minimum_multiplies_ssrgemm_nt_n, 32x64x8_32x32x1_8x4_4x8_1x2) { using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -506,9 +506,9 @@ TEST(SM50_device_minimum_multiplies_ssrgemm_nt_n, 32x128x8_32x64x1_8x8_4x8_1x2) using WarpShape = cutlass::gemm::GemmShape<32, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -542,9 +542,9 @@ TEST(SM50_device_minimum_multiplies_ssrgemm_nt_n, 64x64x8_64x32x1_8x8_8x4_1x2) { using WarpShape = cutlass::gemm::GemmShape<64, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename 
cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -578,9 +578,9 @@ TEST(SM50_device_minimum_multiplies_ssrgemm_nt_n, 32x32x8_16x32x1_4x4_4x8_2x1) { using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -614,9 +614,9 @@ TEST(SM50_device_minimum_multiplies_ssrgemm_nt_n, 64x32x8_32x32x1_8x4_4x8_2x1) { using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -650,9 +650,9 @@ TEST(SM50_device_minimum_multiplies_ssrgemm_nt_n, 64x64x8_32x64x1_8x8_4x8_2x1) { using WarpShape = cutlass::gemm::GemmShape<32, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename 
cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -686,9 +686,9 @@ TEST(SM50_device_minimum_multiplies_ssrgemm_nt_n, 128x32x8_64x32x1_8x8_8x4_2x1) using WarpShape = cutlass::gemm::GemmShape<64, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -722,9 +722,9 @@ TEST(SM50_device_minimum_multiplies_ssrgemm_nt_n, 16x32x8_8x16x1_2x2_4x8_2x2) { using WarpShape = cutlass::gemm::GemmShape<8, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -758,9 +758,9 @@ TEST(SM50_device_minimum_multiplies_ssrgemm_nt_n, 16x64x8_8x32x1_2x4_4x8_2x2) { using WarpShape = cutlass::gemm::GemmShape<8, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename 
cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -794,9 +794,9 @@ TEST(SM50_device_minimum_multiplies_ssrgemm_nt_n, 32x32x8_16x16x1_4x2_4x8_2x2) { using WarpShape = cutlass::gemm::GemmShape<16, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -830,9 +830,9 @@ TEST(SM50_device_minimum_multiplies_ssrgemm_nt_n, 32x64x8_16x32x1_4x4_4x8_2x2) { using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -866,9 +866,9 @@ TEST(SM50_device_minimum_multiplies_ssrgemm_nt_n, 32x128x8_16x64x1_4x8_4x8_2x2) using WarpShape = cutlass::gemm::GemmShape<16, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename 
cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -902,9 +902,9 @@ TEST(SM50_device_minimum_multiplies_ssrgemm_nt_n, 64x32x8_32x16x1_4x4_8x4_2x2) { using WarpShape = cutlass::gemm::GemmShape<32, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -938,9 +938,9 @@ TEST(SM50_device_minimum_multiplies_ssrgemm_nt_n, 64x64x8_32x32x1_8x4_4x8_2x2) { using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -974,9 +974,9 @@ TEST(SM50_device_minimum_multiplies_ssrgemm_nt_n, 64x128x8_32x64x1_8x8_4x8_2x2) using WarpShape = cutlass::gemm::GemmShape<32, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename 
cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1010,9 +1010,9 @@ TEST(SM50_device_minimum_multiplies_ssrgemm_nt_n, 128x32x8_64x16x1_8x4_8x4_2x2) using WarpShape = cutlass::gemm::GemmShape<64, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1046,9 +1046,9 @@ TEST(SM50_device_minimum_multiplies_ssrgemm_nt_n, 128x64x8_64x32x1_8x8_8x4_2x2) using WarpShape = cutlass::gemm::GemmShape<64, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1082,9 +1082,9 @@ TEST(SM50_device_minimum_multiplies_ssrgemm_nt_n, 16x64x16_8x16x1_2x2_4x8_2x4) { using WarpShape = cutlass::gemm::GemmShape<8, 16, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename 
cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1118,9 +1118,9 @@ TEST(SM50_device_minimum_multiplies_ssrgemm_nt_n, 16x128x16_8x32x1_2x4_4x8_2x4) using WarpShape = cutlass::gemm::GemmShape<8, 32, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1154,9 +1154,9 @@ TEST(SM50_device_minimum_multiplies_ssrgemm_nt_n, 32x32x8_16x8x1_2x2_8x4_2x4) { using WarpShape = cutlass::gemm::GemmShape<16, 8, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1190,9 +1190,9 @@ TEST(SM50_device_minimum_multiplies_ssrgemm_nt_n, 32x64x8_16x16x1_4x2_4x8_2x4) { using WarpShape = cutlass::gemm::GemmShape<16, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename 
cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1226,9 +1226,9 @@ TEST(SM50_device_minimum_multiplies_ssrgemm_nt_n, 32x128x8_16x32x1_4x4_4x8_2x4) using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1262,9 +1262,9 @@ TEST(SM50_device_minimum_multiplies_ssrgemm_nt_n, 32x256x8_16x64x1_4x8_4x8_2x4) using WarpShape = cutlass::gemm::GemmShape<16, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1298,9 +1298,9 @@ TEST(SM50_device_minimum_multiplies_ssrgemm_nt_n, 64x64x8_32x16x1_4x4_8x4_2x4) { using WarpShape = cutlass::gemm::GemmShape<32, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename 
cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1334,9 +1334,9 @@ TEST(SM50_device_minimum_multiplies_ssrgemm_nt_n, 64x128x8_32x32x1_8x4_4x8_2x4) using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1370,9 +1370,9 @@ TEST(SM50_device_minimum_multiplies_ssrgemm_nt_n, 64x256x8_32x64x1_8x8_4x8_2x4) using WarpShape = cutlass::gemm::GemmShape<32, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1406,9 +1406,9 @@ TEST(SM50_device_minimum_multiplies_ssrgemm_nt_n, 128x128x8_64x32x1_8x8_8x4_2x4) using WarpShape = cutlass::gemm::GemmShape<64, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename 
cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1442,9 +1442,9 @@ TEST(SM50_device_minimum_multiplies_ssrgemm_nt_n, 32x32x8_8x16x1_2x2_4x8_4x2) { using WarpShape = cutlass::gemm::GemmShape<8, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1478,9 +1478,9 @@ TEST(SM50_device_minimum_multiplies_ssrgemm_nt_n, 64x32x8_16x16x1_4x2_4x8_4x2) { using WarpShape = cutlass::gemm::GemmShape<16, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1514,9 +1514,9 @@ TEST(SM50_device_minimum_multiplies_ssrgemm_nt_n, 64x64x8_16x32x1_4x4_4x8_4x2) { using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename 
cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1550,9 +1550,9 @@ TEST(SM50_device_minimum_multiplies_ssrgemm_nt_n, 128x32x8_32x16x1_4x4_8x4_4x2) using WarpShape = cutlass::gemm::GemmShape<32, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1586,9 +1586,9 @@ TEST(SM50_device_minimum_multiplies_ssrgemm_nt_n, 128x64x8_32x32x1_8x4_4x8_4x2) using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1622,9 +1622,9 @@ TEST(SM50_device_minimum_multiplies_ssrgemm_nt_n, 128x128x8_32x64x1_8x8_4x8_4x2) using WarpShape = cutlass::gemm::GemmShape<32, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename 
cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1658,9 +1658,9 @@ TEST(SM50_device_minimum_multiplies_ssrgemm_nt_n, 256x32x8_64x16x1_8x4_8x4_4x2) using WarpShape = cutlass::gemm::GemmShape<64, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1694,9 +1694,9 @@ TEST(SM50_device_minimum_multiplies_ssrgemm_nt_n, 256x64x8_64x32x1_8x8_8x4_4x2) using WarpShape = cutlass::gemm::GemmShape<64, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1730,9 +1730,9 @@ TEST(SM50_device_minimum_multiplies_ssrgemm_nt_n, 32x64x16_8x16x1_2x2_4x8_4x4) { using WarpShape = cutlass::gemm::GemmShape<8, 16, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename 
cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1766,9 +1766,9 @@ TEST(SM50_device_minimum_multiplies_ssrgemm_nt_n, 32x128x16_8x32x1_2x4_4x8_4x4) using WarpShape = cutlass::gemm::GemmShape<8, 32, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1802,9 +1802,9 @@ TEST(SM50_device_minimum_multiplies_ssrgemm_nt_n, 64x32x16_16x8x1_2x2_8x4_4x4) { using WarpShape = cutlass::gemm::GemmShape<16, 8, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1838,9 +1838,9 @@ TEST(SM50_device_minimum_multiplies_ssrgemm_nt_n, 64x64x8_16x16x1_4x2_4x8_4x4) { using WarpShape = cutlass::gemm::GemmShape<16, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename 
cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1874,9 +1874,9 @@ TEST(SM50_device_minimum_multiplies_ssrgemm_nt_n, 64x128x8_16x32x1_4x4_4x8_4x4) using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1910,9 +1910,9 @@ TEST(SM50_device_minimum_multiplies_ssrgemm_nt_n, 64x256x8_16x64x1_4x8_4x8_4x4) using WarpShape = cutlass::gemm::GemmShape<16, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1946,9 +1946,9 @@ TEST(SM50_device_minimum_multiplies_ssrgemm_nt_n, 128x32x16_32x8x1_4x2_8x4_4x4) using WarpShape = cutlass::gemm::GemmShape<32, 8, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename 
cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1982,9 +1982,9 @@ TEST(SM50_device_minimum_multiplies_ssrgemm_nt_n, 128x64x8_32x16x1_4x4_8x4_4x4) using WarpShape = cutlass::gemm::GemmShape<32, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -2018,9 +2018,9 @@ TEST(SM50_device_minimum_multiplies_ssrgemm_nt_n, 128x128x8_32x32x1_8x4_4x8_4x4) using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -2054,9 +2054,9 @@ TEST(SM50_device_minimum_multiplies_ssrgemm_nt_n, 256x64x8_64x16x1_8x4_8x4_4x4) using WarpShape = cutlass::gemm::GemmShape<64, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename 
cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; diff --git a/test/device/sm50_simt_minimum_multiplies_ssrgemm_nt_t.cu b/test/device/sm50_simt_minimum_multiplies_ssrgemm_nt_t.cu index 4388eb4..849f202 100644 --- a/test/device/sm50_simt_minimum_multiplies_ssrgemm_nt_t.cu +++ b/test/device/sm50_simt_minimum_multiplies_ssrgemm_nt_t.cu @@ -38,9 +38,9 @@ TEST(SM50_device_minimum_multiplies_ssrgemm_nt_t, 8x32x8_8x32x1_2x4_4x8_1x1) { using WarpShape = cutlass::gemm::GemmShape<8, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -74,9 +74,9 @@ TEST(SM50_device_minimum_multiplies_ssrgemm_nt_t, 16x32x8_16x32x1_4x4_4x8_1x1) { using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -110,9 +110,9 @@ TEST(SM50_device_minimum_multiplies_ssrgemm_nt_t, 16x64x8_16x64x1_4x8_4x8_1x1) { using WarpShape = cutlass::gemm::GemmShape<16, 64, 8>; using InstructionShape = 
cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -146,9 +146,9 @@ TEST(SM50_device_minimum_multiplies_ssrgemm_nt_t, 32x32x8_32x32x1_8x4_4x8_1x1) { using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -182,9 +182,9 @@ TEST(SM50_device_minimum_multiplies_ssrgemm_nt_t, 32x64x8_32x64x1_8x8_4x8_1x1) { using WarpShape = cutlass::gemm::GemmShape<32, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -218,9 +218,9 @@ TEST(SM50_device_minimum_multiplies_ssrgemm_nt_t, 64x32x8_64x32x1_8x8_8x4_1x1) { using WarpShape = cutlass::gemm::GemmShape<64, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - 
using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -254,9 +254,9 @@ TEST(SM50_device_minimum_multiplies_ssrgemm_nt_t, 8x32x8_8x16x1_2x2_4x8_1x2) { using WarpShape = cutlass::gemm::GemmShape<8, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -290,9 +290,9 @@ TEST(SM50_device_minimum_multiplies_ssrgemm_nt_t, 8x64x8_8x32x1_2x4_4x8_1x2) { using WarpShape = cutlass::gemm::GemmShape<8, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -326,9 +326,9 @@ TEST(SM50_device_minimum_multiplies_ssrgemm_nt_t, 16x32x8_16x16x1_4x2_4x8_1x2) { using WarpShape = cutlass::gemm::GemmShape<16, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename 
cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -362,9 +362,9 @@ TEST(SM50_device_minimum_multiplies_ssrgemm_nt_t, 16x64x8_16x32x1_4x4_4x8_1x2) { using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -398,9 +398,9 @@ TEST(SM50_device_minimum_multiplies_ssrgemm_nt_t, 16x128x8_16x64x1_4x8_4x8_1x2) using WarpShape = cutlass::gemm::GemmShape<16, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -434,9 +434,9 @@ TEST(SM50_device_minimum_multiplies_ssrgemm_nt_t, 32x32x8_32x16x1_4x4_8x4_1x2) { using WarpShape = cutlass::gemm::GemmShape<32, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename 
cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -470,9 +470,9 @@ TEST(SM50_device_minimum_multiplies_ssrgemm_nt_t, 32x64x8_32x32x1_8x4_4x8_1x2) { using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -506,9 +506,9 @@ TEST(SM50_device_minimum_multiplies_ssrgemm_nt_t, 32x128x8_32x64x1_8x8_4x8_1x2) using WarpShape = cutlass::gemm::GemmShape<32, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -542,9 +542,9 @@ TEST(SM50_device_minimum_multiplies_ssrgemm_nt_t, 64x64x8_64x32x1_8x8_8x4_1x2) { using WarpShape = cutlass::gemm::GemmShape<64, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename 
cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -578,9 +578,9 @@ TEST(SM50_device_minimum_multiplies_ssrgemm_nt_t, 32x32x8_16x32x1_4x4_4x8_2x1) { using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -614,9 +614,9 @@ TEST(SM50_device_minimum_multiplies_ssrgemm_nt_t, 64x32x8_32x32x1_8x4_4x8_2x1) { using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -650,9 +650,9 @@ TEST(SM50_device_minimum_multiplies_ssrgemm_nt_t, 64x64x8_32x64x1_8x8_4x8_2x1) { using WarpShape = cutlass::gemm::GemmShape<32, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename 
cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -686,9 +686,9 @@ TEST(SM50_device_minimum_multiplies_ssrgemm_nt_t, 128x32x8_64x32x1_8x8_8x4_2x1) using WarpShape = cutlass::gemm::GemmShape<64, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -722,9 +722,9 @@ TEST(SM50_device_minimum_multiplies_ssrgemm_nt_t, 16x32x8_8x16x1_2x2_4x8_2x2) { using WarpShape = cutlass::gemm::GemmShape<8, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -758,9 +758,9 @@ TEST(SM50_device_minimum_multiplies_ssrgemm_nt_t, 16x64x8_8x32x1_2x4_4x8_2x2) { using WarpShape = cutlass::gemm::GemmShape<8, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename 
cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -794,9 +794,9 @@ TEST(SM50_device_minimum_multiplies_ssrgemm_nt_t, 32x32x8_16x16x1_4x2_4x8_2x2) { using WarpShape = cutlass::gemm::GemmShape<16, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -830,9 +830,9 @@ TEST(SM50_device_minimum_multiplies_ssrgemm_nt_t, 32x64x8_16x32x1_4x4_4x8_2x2) { using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -866,9 +866,9 @@ TEST(SM50_device_minimum_multiplies_ssrgemm_nt_t, 32x128x8_16x64x1_4x8_4x8_2x2) using WarpShape = cutlass::gemm::GemmShape<16, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename 
cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -902,9 +902,9 @@ TEST(SM50_device_minimum_multiplies_ssrgemm_nt_t, 64x32x8_32x16x1_4x4_8x4_2x2) { using WarpShape = cutlass::gemm::GemmShape<32, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -938,9 +938,9 @@ TEST(SM50_device_minimum_multiplies_ssrgemm_nt_t, 64x64x8_32x32x1_8x4_4x8_2x2) { using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -974,9 +974,9 @@ TEST(SM50_device_minimum_multiplies_ssrgemm_nt_t, 64x128x8_32x64x1_8x8_4x8_2x2) using WarpShape = cutlass::gemm::GemmShape<32, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename 
cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1010,9 +1010,9 @@ TEST(SM50_device_minimum_multiplies_ssrgemm_nt_t, 128x32x8_64x16x1_8x4_8x4_2x2) using WarpShape = cutlass::gemm::GemmShape<64, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1046,9 +1046,9 @@ TEST(SM50_device_minimum_multiplies_ssrgemm_nt_t, 128x64x8_64x32x1_8x8_8x4_2x2) using WarpShape = cutlass::gemm::GemmShape<64, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1082,9 +1082,9 @@ TEST(SM50_device_minimum_multiplies_ssrgemm_nt_t, 16x64x16_8x16x1_2x2_4x8_2x4) { using WarpShape = cutlass::gemm::GemmShape<8, 16, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename 
cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1118,9 +1118,9 @@ TEST(SM50_device_minimum_multiplies_ssrgemm_nt_t, 16x128x16_8x32x1_2x4_4x8_2x4) using WarpShape = cutlass::gemm::GemmShape<8, 32, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1154,9 +1154,9 @@ TEST(SM50_device_minimum_multiplies_ssrgemm_nt_t, 32x32x8_16x8x1_2x2_8x4_2x4) { using WarpShape = cutlass::gemm::GemmShape<16, 8, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1190,9 +1190,9 @@ TEST(SM50_device_minimum_multiplies_ssrgemm_nt_t, 32x64x8_16x16x1_4x2_4x8_2x4) { using WarpShape = cutlass::gemm::GemmShape<16, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename 
cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1226,9 +1226,9 @@ TEST(SM50_device_minimum_multiplies_ssrgemm_nt_t, 32x128x8_16x32x1_4x4_4x8_2x4) using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1262,9 +1262,9 @@ TEST(SM50_device_minimum_multiplies_ssrgemm_nt_t, 32x256x8_16x64x1_4x8_4x8_2x4) using WarpShape = cutlass::gemm::GemmShape<16, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1298,9 +1298,9 @@ TEST(SM50_device_minimum_multiplies_ssrgemm_nt_t, 64x64x8_32x16x1_4x4_8x4_2x4) { using WarpShape = cutlass::gemm::GemmShape<32, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename 
cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1334,9 +1334,9 @@ TEST(SM50_device_minimum_multiplies_ssrgemm_nt_t, 64x128x8_32x32x1_8x4_4x8_2x4) using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1370,9 +1370,9 @@ TEST(SM50_device_minimum_multiplies_ssrgemm_nt_t, 64x256x8_32x64x1_8x8_4x8_2x4) using WarpShape = cutlass::gemm::GemmShape<32, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1406,9 +1406,9 @@ TEST(SM50_device_minimum_multiplies_ssrgemm_nt_t, 128x128x8_64x32x1_8x8_8x4_2x4) using WarpShape = cutlass::gemm::GemmShape<64, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename 
cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1442,9 +1442,9 @@ TEST(SM50_device_minimum_multiplies_ssrgemm_nt_t, 32x32x8_8x16x1_2x2_4x8_4x2) { using WarpShape = cutlass::gemm::GemmShape<8, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1478,9 +1478,9 @@ TEST(SM50_device_minimum_multiplies_ssrgemm_nt_t, 64x32x8_16x16x1_4x2_4x8_4x2) { using WarpShape = cutlass::gemm::GemmShape<16, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1514,9 +1514,9 @@ TEST(SM50_device_minimum_multiplies_ssrgemm_nt_t, 64x64x8_16x32x1_4x4_4x8_4x2) { using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename 
cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1550,9 +1550,9 @@ TEST(SM50_device_minimum_multiplies_ssrgemm_nt_t, 128x32x8_32x16x1_4x4_8x4_4x2) using WarpShape = cutlass::gemm::GemmShape<32, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1586,9 +1586,9 @@ TEST(SM50_device_minimum_multiplies_ssrgemm_nt_t, 128x64x8_32x32x1_8x4_4x8_4x2) using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1622,9 +1622,9 @@ TEST(SM50_device_minimum_multiplies_ssrgemm_nt_t, 128x128x8_32x64x1_8x8_4x8_4x2) using WarpShape = cutlass::gemm::GemmShape<32, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename 
cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1658,9 +1658,9 @@ TEST(SM50_device_minimum_multiplies_ssrgemm_nt_t, 256x32x8_64x16x1_8x4_8x4_4x2) using WarpShape = cutlass::gemm::GemmShape<64, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1694,9 +1694,9 @@ TEST(SM50_device_minimum_multiplies_ssrgemm_nt_t, 256x64x8_64x32x1_8x8_8x4_4x2) using WarpShape = cutlass::gemm::GemmShape<64, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1730,9 +1730,9 @@ TEST(SM50_device_minimum_multiplies_ssrgemm_nt_t, 32x64x16_8x16x1_2x2_4x8_4x4) { using WarpShape = cutlass::gemm::GemmShape<8, 16, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename 
cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1766,9 +1766,9 @@ TEST(SM50_device_minimum_multiplies_ssrgemm_nt_t, 32x128x16_8x32x1_2x4_4x8_4x4) using WarpShape = cutlass::gemm::GemmShape<8, 32, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1802,9 +1802,9 @@ TEST(SM50_device_minimum_multiplies_ssrgemm_nt_t, 64x32x16_16x8x1_2x2_8x4_4x4) { using WarpShape = cutlass::gemm::GemmShape<16, 8, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1838,9 +1838,9 @@ TEST(SM50_device_minimum_multiplies_ssrgemm_nt_t, 64x64x8_16x16x1_4x2_4x8_4x4) { using WarpShape = cutlass::gemm::GemmShape<16, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename 
cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1874,9 +1874,9 @@ TEST(SM50_device_minimum_multiplies_ssrgemm_nt_t, 64x128x8_16x32x1_4x4_4x8_4x4) using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1910,9 +1910,9 @@ TEST(SM50_device_minimum_multiplies_ssrgemm_nt_t, 64x256x8_16x64x1_4x8_4x8_4x4) using WarpShape = cutlass::gemm::GemmShape<16, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1946,9 +1946,9 @@ TEST(SM50_device_minimum_multiplies_ssrgemm_nt_t, 128x32x16_32x8x1_4x2_8x4_4x4) using WarpShape = cutlass::gemm::GemmShape<32, 8, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename 
cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1982,9 +1982,9 @@ TEST(SM50_device_minimum_multiplies_ssrgemm_nt_t, 128x64x8_32x16x1_4x4_8x4_4x4) using WarpShape = cutlass::gemm::GemmShape<32, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -2018,9 +2018,9 @@ TEST(SM50_device_minimum_multiplies_ssrgemm_nt_t, 128x128x8_32x32x1_8x4_4x8_4x4) using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -2054,9 +2054,9 @@ TEST(SM50_device_minimum_multiplies_ssrgemm_nt_t, 256x64x8_64x16x1_8x4_8x4_4x4) using WarpShape = cutlass::gemm::GemmShape<64, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename 
cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; diff --git a/test/device/sm50_simt_minimum_multiplies_ssrgemm_tn_n.cu b/test/device/sm50_simt_minimum_multiplies_ssrgemm_tn_n.cu index 35aeaca..97aaed9 100644 --- a/test/device/sm50_simt_minimum_multiplies_ssrgemm_tn_n.cu +++ b/test/device/sm50_simt_minimum_multiplies_ssrgemm_tn_n.cu @@ -38,9 +38,9 @@ TEST(SM50_device_minimum_multiplies_ssrgemm_tn_n, 8x32x8_8x32x1_2x4_4x8_1x1) { using WarpShape = cutlass::gemm::GemmShape<8, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -74,9 +74,9 @@ TEST(SM50_device_minimum_multiplies_ssrgemm_tn_n, 16x32x8_16x32x1_4x4_4x8_1x1) { using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ 
-110,9 +110,9 @@ TEST(SM50_device_minimum_multiplies_ssrgemm_tn_n, 16x64x8_16x64x1_4x8_4x8_1x1) { using WarpShape = cutlass::gemm::GemmShape<16, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -146,9 +146,9 @@ TEST(SM50_device_minimum_multiplies_ssrgemm_tn_n, 32x32x8_32x32x1_8x4_4x8_1x1) { using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -182,9 +182,9 @@ TEST(SM50_device_minimum_multiplies_ssrgemm_tn_n, 32x64x8_32x64x1_8x8_4x8_1x1) { using WarpShape = cutlass::gemm::GemmShape<32, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -218,9 +218,9 @@ 
TEST(SM50_device_minimum_multiplies_ssrgemm_tn_n, 64x32x8_64x32x1_8x8_8x4_1x1) { using WarpShape = cutlass::gemm::GemmShape<64, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -254,9 +254,9 @@ TEST(SM50_device_minimum_multiplies_ssrgemm_tn_n, 8x32x8_8x16x1_2x2_4x8_1x2) { using WarpShape = cutlass::gemm::GemmShape<8, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -290,9 +290,9 @@ TEST(SM50_device_minimum_multiplies_ssrgemm_tn_n, 8x64x8_8x32x1_2x4_4x8_1x2) { using WarpShape = cutlass::gemm::GemmShape<8, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -326,9 +326,9 @@ 
TEST(SM50_device_minimum_multiplies_ssrgemm_tn_n, 16x32x8_16x16x1_4x2_4x8_1x2) { using WarpShape = cutlass::gemm::GemmShape<16, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -362,9 +362,9 @@ TEST(SM50_device_minimum_multiplies_ssrgemm_tn_n, 16x64x8_16x32x1_4x4_4x8_1x2) { using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -398,9 +398,9 @@ TEST(SM50_device_minimum_multiplies_ssrgemm_tn_n, 16x128x8_16x64x1_4x8_4x8_1x2) using WarpShape = cutlass::gemm::GemmShape<16, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -434,9 +434,9 @@ 
TEST(SM50_device_minimum_multiplies_ssrgemm_tn_n, 32x32x8_32x16x1_4x4_8x4_1x2) { using WarpShape = cutlass::gemm::GemmShape<32, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -470,9 +470,9 @@ TEST(SM50_device_minimum_multiplies_ssrgemm_tn_n, 32x64x8_32x32x1_8x4_4x8_1x2) { using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -506,9 +506,9 @@ TEST(SM50_device_minimum_multiplies_ssrgemm_tn_n, 32x128x8_32x64x1_8x8_4x8_1x2) using WarpShape = cutlass::gemm::GemmShape<32, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -542,9 +542,9 @@ 
TEST(SM50_device_minimum_multiplies_ssrgemm_tn_n, 64x64x8_64x32x1_8x8_8x4_1x2) { using WarpShape = cutlass::gemm::GemmShape<64, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -578,9 +578,9 @@ TEST(SM50_device_minimum_multiplies_ssrgemm_tn_n, 32x32x8_16x32x1_4x4_4x8_2x1) { using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -614,9 +614,9 @@ TEST(SM50_device_minimum_multiplies_ssrgemm_tn_n, 64x32x8_32x32x1_8x4_4x8_2x1) { using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -650,9 +650,9 @@ 
TEST(SM50_device_minimum_multiplies_ssrgemm_tn_n, 64x64x8_32x64x1_8x8_4x8_2x1) { using WarpShape = cutlass::gemm::GemmShape<32, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -686,9 +686,9 @@ TEST(SM50_device_minimum_multiplies_ssrgemm_tn_n, 128x32x8_64x32x1_8x8_8x4_2x1) using WarpShape = cutlass::gemm::GemmShape<64, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -722,9 +722,9 @@ TEST(SM50_device_minimum_multiplies_ssrgemm_tn_n, 16x32x8_8x16x1_2x2_4x8_2x2) { using WarpShape = cutlass::gemm::GemmShape<8, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -758,9 +758,9 @@ 
TEST(SM50_device_minimum_multiplies_ssrgemm_tn_n, 16x64x8_8x32x1_2x4_4x8_2x2) { using WarpShape = cutlass::gemm::GemmShape<8, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -794,9 +794,9 @@ TEST(SM50_device_minimum_multiplies_ssrgemm_tn_n, 32x32x8_16x16x1_4x2_4x8_2x2) { using WarpShape = cutlass::gemm::GemmShape<16, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -830,9 +830,9 @@ TEST(SM50_device_minimum_multiplies_ssrgemm_tn_n, 32x64x8_16x32x1_4x4_4x8_2x2) { using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -866,9 +866,9 @@ 
TEST(SM50_device_minimum_multiplies_ssrgemm_tn_n, 32x128x8_16x64x1_4x8_4x8_2x2) using WarpShape = cutlass::gemm::GemmShape<16, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -902,9 +902,9 @@ TEST(SM50_device_minimum_multiplies_ssrgemm_tn_n, 64x32x8_32x16x1_4x4_8x4_2x2) { using WarpShape = cutlass::gemm::GemmShape<32, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -938,9 +938,9 @@ TEST(SM50_device_minimum_multiplies_ssrgemm_tn_n, 64x64x8_32x32x1_8x4_4x8_2x2) { using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -974,9 +974,9 @@ 
TEST(SM50_device_minimum_multiplies_ssrgemm_tn_n, 64x128x8_32x64x1_8x8_4x8_2x2) using WarpShape = cutlass::gemm::GemmShape<32, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1010,9 +1010,9 @@ TEST(SM50_device_minimum_multiplies_ssrgemm_tn_n, 128x32x8_64x16x1_8x4_8x4_2x2) using WarpShape = cutlass::gemm::GemmShape<64, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1046,9 +1046,9 @@ TEST(SM50_device_minimum_multiplies_ssrgemm_tn_n, 128x64x8_64x32x1_8x8_8x4_2x2) using WarpShape = cutlass::gemm::GemmShape<64, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1082,9 +1082,9 @@ 
TEST(SM50_device_minimum_multiplies_ssrgemm_tn_n, 16x64x16_8x16x1_2x2_4x8_2x4) { using WarpShape = cutlass::gemm::GemmShape<8, 16, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1118,9 +1118,9 @@ TEST(SM50_device_minimum_multiplies_ssrgemm_tn_n, 16x128x16_8x32x1_2x4_4x8_2x4) using WarpShape = cutlass::gemm::GemmShape<8, 32, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1154,9 +1154,9 @@ TEST(SM50_device_minimum_multiplies_ssrgemm_tn_n, 32x32x8_16x8x1_2x2_8x4_2x4) { using WarpShape = cutlass::gemm::GemmShape<16, 8, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1190,9 +1190,9 @@ 
TEST(SM50_device_minimum_multiplies_ssrgemm_tn_n, 32x64x8_16x16x1_4x2_4x8_2x4) { using WarpShape = cutlass::gemm::GemmShape<16, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1226,9 +1226,9 @@ TEST(SM50_device_minimum_multiplies_ssrgemm_tn_n, 32x128x8_16x32x1_4x4_4x8_2x4) using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1262,9 +1262,9 @@ TEST(SM50_device_minimum_multiplies_ssrgemm_tn_n, 32x256x8_16x64x1_4x8_4x8_2x4) using WarpShape = cutlass::gemm::GemmShape<16, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1298,9 +1298,9 @@ 
TEST(SM50_device_minimum_multiplies_ssrgemm_tn_n, 64x64x8_32x16x1_4x4_8x4_2x4) { using WarpShape = cutlass::gemm::GemmShape<32, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1334,9 +1334,9 @@ TEST(SM50_device_minimum_multiplies_ssrgemm_tn_n, 64x128x8_32x32x1_8x4_4x8_2x4) using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1370,9 +1370,9 @@ TEST(SM50_device_minimum_multiplies_ssrgemm_tn_n, 64x256x8_32x64x1_8x8_4x8_2x4) using WarpShape = cutlass::gemm::GemmShape<32, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1406,9 +1406,9 @@ 
TEST(SM50_device_minimum_multiplies_ssrgemm_tn_n, 128x128x8_64x32x1_8x8_8x4_2x4) using WarpShape = cutlass::gemm::GemmShape<64, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1442,9 +1442,9 @@ TEST(SM50_device_minimum_multiplies_ssrgemm_tn_n, 32x32x8_8x16x1_2x2_4x8_4x2) { using WarpShape = cutlass::gemm::GemmShape<8, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1478,9 +1478,9 @@ TEST(SM50_device_minimum_multiplies_ssrgemm_tn_n, 64x32x8_16x16x1_4x2_4x8_4x2) { using WarpShape = cutlass::gemm::GemmShape<16, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1514,9 +1514,9 @@ 
TEST(SM50_device_minimum_multiplies_ssrgemm_tn_n, 64x64x8_16x32x1_4x4_4x8_4x2) { using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1550,9 +1550,9 @@ TEST(SM50_device_minimum_multiplies_ssrgemm_tn_n, 128x32x8_32x16x1_4x4_8x4_4x2) using WarpShape = cutlass::gemm::GemmShape<32, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1586,9 +1586,9 @@ TEST(SM50_device_minimum_multiplies_ssrgemm_tn_n, 128x64x8_32x32x1_8x4_4x8_4x2) using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1622,9 +1622,9 @@ 
TEST(SM50_device_minimum_multiplies_ssrgemm_tn_n, 128x128x8_32x64x1_8x8_4x8_4x2) using WarpShape = cutlass::gemm::GemmShape<32, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1658,9 +1658,9 @@ TEST(SM50_device_minimum_multiplies_ssrgemm_tn_n, 256x32x8_64x16x1_8x4_8x4_4x2) using WarpShape = cutlass::gemm::GemmShape<64, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1694,9 +1694,9 @@ TEST(SM50_device_minimum_multiplies_ssrgemm_tn_n, 256x64x8_64x32x1_8x8_8x4_4x2) using WarpShape = cutlass::gemm::GemmShape<64, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1730,9 +1730,9 @@ 
TEST(SM50_device_minimum_multiplies_ssrgemm_tn_n, 32x64x16_8x16x1_2x2_4x8_4x4) { using WarpShape = cutlass::gemm::GemmShape<8, 16, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1766,9 +1766,9 @@ TEST(SM50_device_minimum_multiplies_ssrgemm_tn_n, 32x128x16_8x32x1_2x4_4x8_4x4) using WarpShape = cutlass::gemm::GemmShape<8, 32, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1802,9 +1802,9 @@ TEST(SM50_device_minimum_multiplies_ssrgemm_tn_n, 64x32x16_16x8x1_2x2_8x4_4x4) { using WarpShape = cutlass::gemm::GemmShape<16, 8, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1838,9 +1838,9 @@ 
TEST(SM50_device_minimum_multiplies_ssrgemm_tn_n, 64x64x8_16x16x1_4x2_4x8_4x4) { using WarpShape = cutlass::gemm::GemmShape<16, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1874,9 +1874,9 @@ TEST(SM50_device_minimum_multiplies_ssrgemm_tn_n, 64x128x8_16x32x1_4x4_4x8_4x4) using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1910,9 +1910,9 @@ TEST(SM50_device_minimum_multiplies_ssrgemm_tn_n, 64x256x8_16x64x1_4x8_4x8_4x4) using WarpShape = cutlass::gemm::GemmShape<16, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1946,9 +1946,9 @@ 
TEST(SM50_device_minimum_multiplies_ssrgemm_tn_n, 128x32x16_32x8x1_4x2_8x4_4x4) using WarpShape = cutlass::gemm::GemmShape<32, 8, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1982,9 +1982,9 @@ TEST(SM50_device_minimum_multiplies_ssrgemm_tn_n, 128x64x8_32x16x1_4x4_8x4_4x4) using WarpShape = cutlass::gemm::GemmShape<32, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -2018,9 +2018,9 @@ TEST(SM50_device_minimum_multiplies_ssrgemm_tn_n, 128x128x8_32x32x1_8x4_4x8_4x4) using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -2054,9 +2054,9 @@ 
TEST(SM50_device_minimum_multiplies_ssrgemm_tn_n, 256x64x8_64x16x1_8x4_8x4_4x4) using WarpShape = cutlass::gemm::GemmShape<64, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; diff --git a/test/device/sm50_simt_minimum_multiplies_ssrgemm_tn_t.cu b/test/device/sm50_simt_minimum_multiplies_ssrgemm_tn_t.cu index bb8b9c7..756f285 100644 --- a/test/device/sm50_simt_minimum_multiplies_ssrgemm_tn_t.cu +++ b/test/device/sm50_simt_minimum_multiplies_ssrgemm_tn_t.cu @@ -38,9 +38,9 @@ TEST(SM50_device_minimum_multiplies_ssrgemm_tn_t, 8x32x8_8x32x1_2x4_4x8_1x1) { using WarpShape = cutlass::gemm::GemmShape<8, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -74,9 +74,9 @@ TEST(SM50_device_minimum_multiplies_ssrgemm_tn_t, 16x32x8_16x32x1_4x4_4x8_1x1) { using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename 
cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -110,9 +110,9 @@ TEST(SM50_device_minimum_multiplies_ssrgemm_tn_t, 16x64x8_16x64x1_4x8_4x8_1x1) { using WarpShape = cutlass::gemm::GemmShape<16, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -146,9 +146,9 @@ TEST(SM50_device_minimum_multiplies_ssrgemm_tn_t, 32x32x8_32x32x1_8x4_4x8_1x1) { using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -182,9 +182,9 @@ TEST(SM50_device_minimum_multiplies_ssrgemm_tn_t, 32x64x8_32x64x1_8x8_4x8_1x1) { using WarpShape = cutlass::gemm::GemmShape<32, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename 
cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -218,9 +218,9 @@ TEST(SM50_device_minimum_multiplies_ssrgemm_tn_t, 64x32x8_64x32x1_8x8_8x4_1x1) { using WarpShape = cutlass::gemm::GemmShape<64, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -254,9 +254,9 @@ TEST(SM50_device_minimum_multiplies_ssrgemm_tn_t, 8x32x8_8x16x1_2x2_4x8_1x2) { using WarpShape = cutlass::gemm::GemmShape<8, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -290,9 +290,9 @@ TEST(SM50_device_minimum_multiplies_ssrgemm_tn_t, 8x64x8_8x32x1_2x4_4x8_1x2) { using WarpShape = cutlass::gemm::GemmShape<8, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename 
cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -326,9 +326,9 @@ TEST(SM50_device_minimum_multiplies_ssrgemm_tn_t, 16x32x8_16x16x1_4x2_4x8_1x2) { using WarpShape = cutlass::gemm::GemmShape<16, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -362,9 +362,9 @@ TEST(SM50_device_minimum_multiplies_ssrgemm_tn_t, 16x64x8_16x32x1_4x4_4x8_1x2) { using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -398,9 +398,9 @@ TEST(SM50_device_minimum_multiplies_ssrgemm_tn_t, 16x128x8_16x64x1_4x8_4x8_1x2) using WarpShape = cutlass::gemm::GemmShape<16, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename 
cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -434,9 +434,9 @@ TEST(SM50_device_minimum_multiplies_ssrgemm_tn_t, 32x32x8_32x16x1_4x4_8x4_1x2) { using WarpShape = cutlass::gemm::GemmShape<32, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -470,9 +470,9 @@ TEST(SM50_device_minimum_multiplies_ssrgemm_tn_t, 32x64x8_32x32x1_8x4_4x8_1x2) { using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -506,9 +506,9 @@ TEST(SM50_device_minimum_multiplies_ssrgemm_tn_t, 32x128x8_32x64x1_8x8_4x8_1x2) using WarpShape = cutlass::gemm::GemmShape<32, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename 
cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -542,9 +542,9 @@ TEST(SM50_device_minimum_multiplies_ssrgemm_tn_t, 64x64x8_64x32x1_8x8_8x4_1x2) { using WarpShape = cutlass::gemm::GemmShape<64, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -578,9 +578,9 @@ TEST(SM50_device_minimum_multiplies_ssrgemm_tn_t, 32x32x8_16x32x1_4x4_4x8_2x1) { using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -614,9 +614,9 @@ TEST(SM50_device_minimum_multiplies_ssrgemm_tn_t, 64x32x8_32x32x1_8x4_4x8_2x1) { using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename 
cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -650,9 +650,9 @@ TEST(SM50_device_minimum_multiplies_ssrgemm_tn_t, 64x64x8_32x64x1_8x8_4x8_2x1) { using WarpShape = cutlass::gemm::GemmShape<32, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -686,9 +686,9 @@ TEST(SM50_device_minimum_multiplies_ssrgemm_tn_t, 128x32x8_64x32x1_8x8_8x4_2x1) using WarpShape = cutlass::gemm::GemmShape<64, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -722,9 +722,9 @@ TEST(SM50_device_minimum_multiplies_ssrgemm_tn_t, 16x32x8_8x16x1_2x2_4x8_2x2) { using WarpShape = cutlass::gemm::GemmShape<8, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename 
cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -758,9 +758,9 @@ TEST(SM50_device_minimum_multiplies_ssrgemm_tn_t, 16x64x8_8x32x1_2x4_4x8_2x2) { using WarpShape = cutlass::gemm::GemmShape<8, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -794,9 +794,9 @@ TEST(SM50_device_minimum_multiplies_ssrgemm_tn_t, 32x32x8_16x16x1_4x2_4x8_2x2) { using WarpShape = cutlass::gemm::GemmShape<16, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -830,9 +830,9 @@ TEST(SM50_device_minimum_multiplies_ssrgemm_tn_t, 32x64x8_16x32x1_4x4_4x8_2x2) { using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename 
cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -866,9 +866,9 @@ TEST(SM50_device_minimum_multiplies_ssrgemm_tn_t, 32x128x8_16x64x1_4x8_4x8_2x2) using WarpShape = cutlass::gemm::GemmShape<16, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -902,9 +902,9 @@ TEST(SM50_device_minimum_multiplies_ssrgemm_tn_t, 64x32x8_32x16x1_4x4_8x4_2x2) { using WarpShape = cutlass::gemm::GemmShape<32, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -938,9 +938,9 @@ TEST(SM50_device_minimum_multiplies_ssrgemm_tn_t, 64x64x8_32x32x1_8x4_4x8_2x2) { using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename 
cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -974,9 +974,9 @@ TEST(SM50_device_minimum_multiplies_ssrgemm_tn_t, 64x128x8_32x64x1_8x8_4x8_2x2) using WarpShape = cutlass::gemm::GemmShape<32, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1010,9 +1010,9 @@ TEST(SM50_device_minimum_multiplies_ssrgemm_tn_t, 128x32x8_64x16x1_8x4_8x4_2x2) using WarpShape = cutlass::gemm::GemmShape<64, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1046,9 +1046,9 @@ TEST(SM50_device_minimum_multiplies_ssrgemm_tn_t, 128x64x8_64x32x1_8x8_8x4_2x2) using WarpShape = cutlass::gemm::GemmShape<64, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename 
cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1082,9 +1082,9 @@ TEST(SM50_device_minimum_multiplies_ssrgemm_tn_t, 16x64x16_8x16x1_2x2_4x8_2x4) { using WarpShape = cutlass::gemm::GemmShape<8, 16, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1118,9 +1118,9 @@ TEST(SM50_device_minimum_multiplies_ssrgemm_tn_t, 16x128x16_8x32x1_2x4_4x8_2x4) using WarpShape = cutlass::gemm::GemmShape<8, 32, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1154,9 +1154,9 @@ TEST(SM50_device_minimum_multiplies_ssrgemm_tn_t, 32x32x8_16x8x1_2x2_8x4_2x4) { using WarpShape = cutlass::gemm::GemmShape<16, 8, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename 
cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1190,9 +1190,9 @@ TEST(SM50_device_minimum_multiplies_ssrgemm_tn_t, 32x64x8_16x16x1_4x2_4x8_2x4) { using WarpShape = cutlass::gemm::GemmShape<16, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1226,9 +1226,9 @@ TEST(SM50_device_minimum_multiplies_ssrgemm_tn_t, 32x128x8_16x32x1_4x4_4x8_2x4) using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1262,9 +1262,9 @@ TEST(SM50_device_minimum_multiplies_ssrgemm_tn_t, 32x256x8_16x64x1_4x8_4x8_2x4) using WarpShape = cutlass::gemm::GemmShape<16, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename 
cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1298,9 +1298,9 @@ TEST(SM50_device_minimum_multiplies_ssrgemm_tn_t, 64x64x8_32x16x1_4x4_8x4_2x4) { using WarpShape = cutlass::gemm::GemmShape<32, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1334,9 +1334,9 @@ TEST(SM50_device_minimum_multiplies_ssrgemm_tn_t, 64x128x8_32x32x1_8x4_4x8_2x4) using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1370,9 +1370,9 @@ TEST(SM50_device_minimum_multiplies_ssrgemm_tn_t, 64x256x8_32x64x1_8x8_4x8_2x4) using WarpShape = cutlass::gemm::GemmShape<32, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename 
cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1406,9 +1406,9 @@ TEST(SM50_device_minimum_multiplies_ssrgemm_tn_t, 128x128x8_64x32x1_8x8_8x4_2x4) using WarpShape = cutlass::gemm::GemmShape<64, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1442,9 +1442,9 @@ TEST(SM50_device_minimum_multiplies_ssrgemm_tn_t, 32x32x8_8x16x1_2x2_4x8_4x2) { using WarpShape = cutlass::gemm::GemmShape<8, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1478,9 +1478,9 @@ TEST(SM50_device_minimum_multiplies_ssrgemm_tn_t, 64x32x8_16x16x1_4x2_4x8_4x2) { using WarpShape = cutlass::gemm::GemmShape<16, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename 
cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1514,9 +1514,9 @@ TEST(SM50_device_minimum_multiplies_ssrgemm_tn_t, 64x64x8_16x32x1_4x4_4x8_4x2) { using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1550,9 +1550,9 @@ TEST(SM50_device_minimum_multiplies_ssrgemm_tn_t, 128x32x8_32x16x1_4x4_8x4_4x2) using WarpShape = cutlass::gemm::GemmShape<32, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1586,9 +1586,9 @@ TEST(SM50_device_minimum_multiplies_ssrgemm_tn_t, 128x64x8_32x32x1_8x4_4x8_4x2) using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename 
cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1622,9 +1622,9 @@ TEST(SM50_device_minimum_multiplies_ssrgemm_tn_t, 128x128x8_32x64x1_8x8_4x8_4x2) using WarpShape = cutlass::gemm::GemmShape<32, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1658,9 +1658,9 @@ TEST(SM50_device_minimum_multiplies_ssrgemm_tn_t, 256x32x8_64x16x1_8x4_8x4_4x2) using WarpShape = cutlass::gemm::GemmShape<64, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1694,9 +1694,9 @@ TEST(SM50_device_minimum_multiplies_ssrgemm_tn_t, 256x64x8_64x32x1_8x8_8x4_4x2) using WarpShape = cutlass::gemm::GemmShape<64, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename 
cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1730,9 +1730,9 @@ TEST(SM50_device_minimum_multiplies_ssrgemm_tn_t, 32x64x16_8x16x1_2x2_4x8_4x4) { using WarpShape = cutlass::gemm::GemmShape<8, 16, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1766,9 +1766,9 @@ TEST(SM50_device_minimum_multiplies_ssrgemm_tn_t, 32x128x16_8x32x1_2x4_4x8_4x4) using WarpShape = cutlass::gemm::GemmShape<8, 32, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1802,9 +1802,9 @@ TEST(SM50_device_minimum_multiplies_ssrgemm_tn_t, 64x32x16_16x8x1_2x2_8x4_4x4) { using WarpShape = cutlass::gemm::GemmShape<16, 8, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename 
cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1838,9 +1838,9 @@ TEST(SM50_device_minimum_multiplies_ssrgemm_tn_t, 64x64x8_16x16x1_4x2_4x8_4x4) { using WarpShape = cutlass::gemm::GemmShape<16, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1874,9 +1874,9 @@ TEST(SM50_device_minimum_multiplies_ssrgemm_tn_t, 64x128x8_16x32x1_4x4_4x8_4x4) using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1910,9 +1910,9 @@ TEST(SM50_device_minimum_multiplies_ssrgemm_tn_t, 64x256x8_16x64x1_4x8_4x8_4x4) using WarpShape = cutlass::gemm::GemmShape<16, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename 
cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1946,9 +1946,9 @@ TEST(SM50_device_minimum_multiplies_ssrgemm_tn_t, 128x32x16_32x8x1_4x2_8x4_4x4) using WarpShape = cutlass::gemm::GemmShape<32, 8, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1982,9 +1982,9 @@ TEST(SM50_device_minimum_multiplies_ssrgemm_tn_t, 128x64x8_32x16x1_4x4_8x4_4x4) using WarpShape = cutlass::gemm::GemmShape<32, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -2018,9 +2018,9 @@ TEST(SM50_device_minimum_multiplies_ssrgemm_tn_t, 128x128x8_32x32x1_8x4_4x8_4x4) using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename 
cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -2054,9 +2054,9 @@ TEST(SM50_device_minimum_multiplies_ssrgemm_tn_t, 256x64x8_64x16x1_8x4_8x4_4x4) using WarpShape = cutlass::gemm::GemmShape<64, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; diff --git a/test/device/sm50_simt_minimum_multiplies_ssrgemm_tt_n.cu b/test/device/sm50_simt_minimum_multiplies_ssrgemm_tt_n.cu index 9521aba..592677e 100644 --- a/test/device/sm50_simt_minimum_multiplies_ssrgemm_tt_n.cu +++ b/test/device/sm50_simt_minimum_multiplies_ssrgemm_tt_n.cu @@ -38,9 +38,9 @@ TEST(SM50_device_minimum_multiplies_ssrgemm_tt_n, 8x32x8_8x32x1_2x4_4x8_1x1) { using WarpShape = cutlass::gemm::GemmShape<8, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -74,9 +74,9 @@ TEST(SM50_device_minimum_multiplies_ssrgemm_tt_n, 16x32x8_16x32x1_4x4_4x8_1x1) { using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = 
cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -110,9 +110,9 @@ TEST(SM50_device_minimum_multiplies_ssrgemm_tt_n, 16x64x8_16x64x1_4x8_4x8_1x1) { using WarpShape = cutlass::gemm::GemmShape<16, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -146,9 +146,9 @@ TEST(SM50_device_minimum_multiplies_ssrgemm_tt_n, 32x32x8_32x32x1_8x4_4x8_1x1) { using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -182,9 +182,9 @@ TEST(SM50_device_minimum_multiplies_ssrgemm_tt_n, 32x64x8_32x64x1_8x8_4x8_1x1) { using WarpShape = cutlass::gemm::GemmShape<32, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - 
using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -218,9 +218,9 @@ TEST(SM50_device_minimum_multiplies_ssrgemm_tt_n, 64x32x8_64x32x1_8x8_8x4_1x1) { using WarpShape = cutlass::gemm::GemmShape<64, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -254,9 +254,9 @@ TEST(SM50_device_minimum_multiplies_ssrgemm_tt_n, 8x32x8_8x16x1_2x2_4x8_1x2) { using WarpShape = cutlass::gemm::GemmShape<8, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -290,9 +290,9 @@ TEST(SM50_device_minimum_multiplies_ssrgemm_tt_n, 8x64x8_8x32x1_2x4_4x8_1x2) { using WarpShape = cutlass::gemm::GemmShape<8, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename 
cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -326,9 +326,9 @@ TEST(SM50_device_minimum_multiplies_ssrgemm_tt_n, 16x32x8_16x16x1_4x2_4x8_1x2) { using WarpShape = cutlass::gemm::GemmShape<16, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -362,9 +362,9 @@ TEST(SM50_device_minimum_multiplies_ssrgemm_tt_n, 16x64x8_16x32x1_4x4_4x8_1x2) { using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -398,9 +398,9 @@ TEST(SM50_device_minimum_multiplies_ssrgemm_tt_n, 16x128x8_16x64x1_4x8_4x8_1x2) using WarpShape = cutlass::gemm::GemmShape<16, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename 
cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -434,9 +434,9 @@ TEST(SM50_device_minimum_multiplies_ssrgemm_tt_n, 32x32x8_32x16x1_4x4_8x4_1x2) { using WarpShape = cutlass::gemm::GemmShape<32, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -470,9 +470,9 @@ TEST(SM50_device_minimum_multiplies_ssrgemm_tt_n, 32x64x8_32x32x1_8x4_4x8_1x2) { using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -506,9 +506,9 @@ TEST(SM50_device_minimum_multiplies_ssrgemm_tt_n, 32x128x8_32x64x1_8x8_4x8_1x2) using WarpShape = cutlass::gemm::GemmShape<32, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename 
cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -542,9 +542,9 @@ TEST(SM50_device_minimum_multiplies_ssrgemm_tt_n, 64x64x8_64x32x1_8x8_8x4_1x2) { using WarpShape = cutlass::gemm::GemmShape<64, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -578,9 +578,9 @@ TEST(SM50_device_minimum_multiplies_ssrgemm_tt_n, 32x32x8_16x32x1_4x4_4x8_2x1) { using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -614,9 +614,9 @@ TEST(SM50_device_minimum_multiplies_ssrgemm_tt_n, 64x32x8_32x32x1_8x4_4x8_2x1) { using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename 
cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -650,9 +650,9 @@ TEST(SM50_device_minimum_multiplies_ssrgemm_tt_n, 64x64x8_32x64x1_8x8_4x8_2x1) { using WarpShape = cutlass::gemm::GemmShape<32, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -686,9 +686,9 @@ TEST(SM50_device_minimum_multiplies_ssrgemm_tt_n, 128x32x8_64x32x1_8x8_8x4_2x1) using WarpShape = cutlass::gemm::GemmShape<64, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -722,9 +722,9 @@ TEST(SM50_device_minimum_multiplies_ssrgemm_tt_n, 16x32x8_8x16x1_2x2_4x8_2x2) { using WarpShape = cutlass::gemm::GemmShape<8, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename 
cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -758,9 +758,9 @@ TEST(SM50_device_minimum_multiplies_ssrgemm_tt_n, 16x64x8_8x32x1_2x4_4x8_2x2) { using WarpShape = cutlass::gemm::GemmShape<8, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -794,9 +794,9 @@ TEST(SM50_device_minimum_multiplies_ssrgemm_tt_n, 32x32x8_16x16x1_4x2_4x8_2x2) { using WarpShape = cutlass::gemm::GemmShape<16, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -830,9 +830,9 @@ TEST(SM50_device_minimum_multiplies_ssrgemm_tt_n, 32x64x8_16x32x1_4x4_4x8_2x2) { using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename 
cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -866,9 +866,9 @@ TEST(SM50_device_minimum_multiplies_ssrgemm_tt_n, 32x128x8_16x64x1_4x8_4x8_2x2) using WarpShape = cutlass::gemm::GemmShape<16, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -902,9 +902,9 @@ TEST(SM50_device_minimum_multiplies_ssrgemm_tt_n, 64x32x8_32x16x1_4x4_8x4_2x2) { using WarpShape = cutlass::gemm::GemmShape<32, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -938,9 +938,9 @@ TEST(SM50_device_minimum_multiplies_ssrgemm_tt_n, 64x64x8_32x32x1_8x4_4x8_2x2) { using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename 
cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -974,9 +974,9 @@ TEST(SM50_device_minimum_multiplies_ssrgemm_tt_n, 64x128x8_32x64x1_8x8_4x8_2x2) using WarpShape = cutlass::gemm::GemmShape<32, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1010,9 +1010,9 @@ TEST(SM50_device_minimum_multiplies_ssrgemm_tt_n, 128x32x8_64x16x1_8x4_8x4_2x2) using WarpShape = cutlass::gemm::GemmShape<64, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1046,9 +1046,9 @@ TEST(SM50_device_minimum_multiplies_ssrgemm_tt_n, 128x64x8_64x32x1_8x8_8x4_2x2) using WarpShape = cutlass::gemm::GemmShape<64, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename 
cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1082,9 +1082,9 @@ TEST(SM50_device_minimum_multiplies_ssrgemm_tt_n, 16x64x16_8x16x1_2x2_4x8_2x4) { using WarpShape = cutlass::gemm::GemmShape<8, 16, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1118,9 +1118,9 @@ TEST(SM50_device_minimum_multiplies_ssrgemm_tt_n, 16x128x16_8x32x1_2x4_4x8_2x4) using WarpShape = cutlass::gemm::GemmShape<8, 32, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1154,9 +1154,9 @@ TEST(SM50_device_minimum_multiplies_ssrgemm_tt_n, 32x32x8_16x8x1_2x2_8x4_2x4) { using WarpShape = cutlass::gemm::GemmShape<16, 8, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename 
cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1190,9 +1190,9 @@ TEST(SM50_device_minimum_multiplies_ssrgemm_tt_n, 32x64x8_16x16x1_4x2_4x8_2x4) { using WarpShape = cutlass::gemm::GemmShape<16, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1226,9 +1226,9 @@ TEST(SM50_device_minimum_multiplies_ssrgemm_tt_n, 32x128x8_16x32x1_4x4_4x8_2x4) using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1262,9 +1262,9 @@ TEST(SM50_device_minimum_multiplies_ssrgemm_tt_n, 32x256x8_16x64x1_4x8_4x8_2x4) using WarpShape = cutlass::gemm::GemmShape<16, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename 
cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1298,9 +1298,9 @@ TEST(SM50_device_minimum_multiplies_ssrgemm_tt_n, 64x64x8_32x16x1_4x4_8x4_2x4) { using WarpShape = cutlass::gemm::GemmShape<32, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1334,9 +1334,9 @@ TEST(SM50_device_minimum_multiplies_ssrgemm_tt_n, 64x128x8_32x32x1_8x4_4x8_2x4) using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1370,9 +1370,9 @@ TEST(SM50_device_minimum_multiplies_ssrgemm_tt_n, 64x256x8_32x64x1_8x8_4x8_2x4) using WarpShape = cutlass::gemm::GemmShape<32, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename 
cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1406,9 +1406,9 @@ TEST(SM50_device_minimum_multiplies_ssrgemm_tt_n, 128x128x8_64x32x1_8x8_8x4_2x4) using WarpShape = cutlass::gemm::GemmShape<64, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1442,9 +1442,9 @@ TEST(SM50_device_minimum_multiplies_ssrgemm_tt_n, 32x32x8_8x16x1_2x2_4x8_4x2) { using WarpShape = cutlass::gemm::GemmShape<8, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1478,9 +1478,9 @@ TEST(SM50_device_minimum_multiplies_ssrgemm_tt_n, 64x32x8_16x16x1_4x2_4x8_4x2) { using WarpShape = cutlass::gemm::GemmShape<16, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename 
cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1514,9 +1514,9 @@ TEST(SM50_device_minimum_multiplies_ssrgemm_tt_n, 64x64x8_16x32x1_4x4_4x8_4x2) { using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1550,9 +1550,9 @@ TEST(SM50_device_minimum_multiplies_ssrgemm_tt_n, 128x32x8_32x16x1_4x4_8x4_4x2) using WarpShape = cutlass::gemm::GemmShape<32, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1586,9 +1586,9 @@ TEST(SM50_device_minimum_multiplies_ssrgemm_tt_n, 128x64x8_32x32x1_8x4_4x8_4x2) using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename 
cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1622,9 +1622,9 @@ TEST(SM50_device_minimum_multiplies_ssrgemm_tt_n, 128x128x8_32x64x1_8x8_4x8_4x2) using WarpShape = cutlass::gemm::GemmShape<32, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1658,9 +1658,9 @@ TEST(SM50_device_minimum_multiplies_ssrgemm_tt_n, 256x32x8_64x16x1_8x4_8x4_4x2) using WarpShape = cutlass::gemm::GemmShape<64, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1694,9 +1694,9 @@ TEST(SM50_device_minimum_multiplies_ssrgemm_tt_n, 256x64x8_64x32x1_8x8_8x4_4x2) using WarpShape = cutlass::gemm::GemmShape<64, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename 
cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1730,9 +1730,9 @@ TEST(SM50_device_minimum_multiplies_ssrgemm_tt_n, 32x64x16_8x16x1_2x2_4x8_4x4) { using WarpShape = cutlass::gemm::GemmShape<8, 16, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1766,9 +1766,9 @@ TEST(SM50_device_minimum_multiplies_ssrgemm_tt_n, 32x128x16_8x32x1_2x4_4x8_4x4) using WarpShape = cutlass::gemm::GemmShape<8, 32, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1802,9 +1802,9 @@ TEST(SM50_device_minimum_multiplies_ssrgemm_tt_n, 64x32x16_16x8x1_2x2_8x4_4x4) { using WarpShape = cutlass::gemm::GemmShape<16, 8, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename 
cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1838,9 +1838,9 @@ TEST(SM50_device_minimum_multiplies_ssrgemm_tt_n, 64x64x8_16x16x1_4x2_4x8_4x4) { using WarpShape = cutlass::gemm::GemmShape<16, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1874,9 +1874,9 @@ TEST(SM50_device_minimum_multiplies_ssrgemm_tt_n, 64x128x8_16x32x1_4x4_4x8_4x4) using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1910,9 +1910,9 @@ TEST(SM50_device_minimum_multiplies_ssrgemm_tt_n, 64x256x8_16x64x1_4x8_4x8_4x4) using WarpShape = cutlass::gemm::GemmShape<16, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename 
cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1946,9 +1946,9 @@ TEST(SM50_device_minimum_multiplies_ssrgemm_tt_n, 128x32x16_32x8x1_4x2_8x4_4x4) using WarpShape = cutlass::gemm::GemmShape<32, 8, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1982,9 +1982,9 @@ TEST(SM50_device_minimum_multiplies_ssrgemm_tt_n, 128x64x8_32x16x1_4x4_8x4_4x4) using WarpShape = cutlass::gemm::GemmShape<32, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -2018,9 +2018,9 @@ TEST(SM50_device_minimum_multiplies_ssrgemm_tt_n, 128x128x8_32x32x1_8x4_4x8_4x4) using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename 
cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -2054,9 +2054,9 @@ TEST(SM50_device_minimum_multiplies_ssrgemm_tt_n, 256x64x8_64x16x1_8x4_8x4_4x4) using WarpShape = cutlass::gemm::GemmShape<64, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; diff --git a/test/device/sm50_simt_minimum_multiplies_ssrgemm_tt_t.cu b/test/device/sm50_simt_minimum_multiplies_ssrgemm_tt_t.cu index b4fd358..f242537 100644 --- a/test/device/sm50_simt_minimum_multiplies_ssrgemm_tt_t.cu +++ b/test/device/sm50_simt_minimum_multiplies_ssrgemm_tt_t.cu @@ -38,9 +38,9 @@ TEST(SM50_device_minimum_multiplies_ssrgemm_tt_t, 8x32x8_8x32x1_2x4_4x8_1x1) { using WarpShape = cutlass::gemm::GemmShape<8, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; 
@@ -74,9 +74,9 @@ TEST(SM50_device_minimum_multiplies_ssrgemm_tt_t, 16x32x8_16x32x1_4x4_4x8_1x1) { using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -110,9 +110,9 @@ TEST(SM50_device_minimum_multiplies_ssrgemm_tt_t, 16x64x8_16x64x1_4x8_4x8_1x1) { using WarpShape = cutlass::gemm::GemmShape<16, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -146,9 +146,9 @@ TEST(SM50_device_minimum_multiplies_ssrgemm_tt_t, 32x32x8_32x32x1_8x4_4x8_1x1) { using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -182,9 +182,9 @@ 
TEST(SM50_device_minimum_multiplies_ssrgemm_tt_t, 32x64x8_32x64x1_8x8_4x8_1x1) { using WarpShape = cutlass::gemm::GemmShape<32, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -218,9 +218,9 @@ TEST(SM50_device_minimum_multiplies_ssrgemm_tt_t, 64x32x8_64x32x1_8x8_8x4_1x1) { using WarpShape = cutlass::gemm::GemmShape<64, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -254,9 +254,9 @@ TEST(SM50_device_minimum_multiplies_ssrgemm_tt_t, 8x32x8_8x16x1_2x2_4x8_1x2) { using WarpShape = cutlass::gemm::GemmShape<8, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -290,9 +290,9 @@ 
TEST(SM50_device_minimum_multiplies_ssrgemm_tt_t, 8x64x8_8x32x1_2x4_4x8_1x2) { using WarpShape = cutlass::gemm::GemmShape<8, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -326,9 +326,9 @@ TEST(SM50_device_minimum_multiplies_ssrgemm_tt_t, 16x32x8_16x16x1_4x2_4x8_1x2) { using WarpShape = cutlass::gemm::GemmShape<16, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -362,9 +362,9 @@ TEST(SM50_device_minimum_multiplies_ssrgemm_tt_t, 16x64x8_16x32x1_4x4_4x8_1x2) { using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -398,9 +398,9 @@ 
TEST(SM50_device_minimum_multiplies_ssrgemm_tt_t, 16x128x8_16x64x1_4x8_4x8_1x2) using WarpShape = cutlass::gemm::GemmShape<16, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -434,9 +434,9 @@ TEST(SM50_device_minimum_multiplies_ssrgemm_tt_t, 32x32x8_32x16x1_4x4_8x4_1x2) { using WarpShape = cutlass::gemm::GemmShape<32, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -470,9 +470,9 @@ TEST(SM50_device_minimum_multiplies_ssrgemm_tt_t, 32x64x8_32x32x1_8x4_4x8_1x2) { using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -506,9 +506,9 @@ 
TEST(SM50_device_minimum_multiplies_ssrgemm_tt_t, 32x128x8_32x64x1_8x8_4x8_1x2) using WarpShape = cutlass::gemm::GemmShape<32, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -542,9 +542,9 @@ TEST(SM50_device_minimum_multiplies_ssrgemm_tt_t, 64x64x8_64x32x1_8x8_8x4_1x2) { using WarpShape = cutlass::gemm::GemmShape<64, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -578,9 +578,9 @@ TEST(SM50_device_minimum_multiplies_ssrgemm_tt_t, 32x32x8_16x32x1_4x4_4x8_2x1) { using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -614,9 +614,9 @@ 
TEST(SM50_device_minimum_multiplies_ssrgemm_tt_t, 64x32x8_32x32x1_8x4_4x8_2x1) { using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -650,9 +650,9 @@ TEST(SM50_device_minimum_multiplies_ssrgemm_tt_t, 64x64x8_32x64x1_8x8_4x8_2x1) { using WarpShape = cutlass::gemm::GemmShape<32, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -686,9 +686,9 @@ TEST(SM50_device_minimum_multiplies_ssrgemm_tt_t, 128x32x8_64x32x1_8x8_8x4_2x1) using WarpShape = cutlass::gemm::GemmShape<64, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -722,9 +722,9 @@ 
TEST(SM50_device_minimum_multiplies_ssrgemm_tt_t, 16x32x8_8x16x1_2x2_4x8_2x2) { using WarpShape = cutlass::gemm::GemmShape<8, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -758,9 +758,9 @@ TEST(SM50_device_minimum_multiplies_ssrgemm_tt_t, 16x64x8_8x32x1_2x4_4x8_2x2) { using WarpShape = cutlass::gemm::GemmShape<8, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -794,9 +794,9 @@ TEST(SM50_device_minimum_multiplies_ssrgemm_tt_t, 32x32x8_16x16x1_4x2_4x8_2x2) { using WarpShape = cutlass::gemm::GemmShape<16, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -830,9 +830,9 @@ 
TEST(SM50_device_minimum_multiplies_ssrgemm_tt_t, 32x64x8_16x32x1_4x4_4x8_2x2) { using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -866,9 +866,9 @@ TEST(SM50_device_minimum_multiplies_ssrgemm_tt_t, 32x128x8_16x64x1_4x8_4x8_2x2) using WarpShape = cutlass::gemm::GemmShape<16, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -902,9 +902,9 @@ TEST(SM50_device_minimum_multiplies_ssrgemm_tt_t, 64x32x8_32x16x1_4x4_8x4_2x2) { using WarpShape = cutlass::gemm::GemmShape<32, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -938,9 +938,9 @@ 
TEST(SM50_device_minimum_multiplies_ssrgemm_tt_t, 64x64x8_32x32x1_8x4_4x8_2x2) { using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -974,9 +974,9 @@ TEST(SM50_device_minimum_multiplies_ssrgemm_tt_t, 64x128x8_32x64x1_8x8_4x8_2x2) using WarpShape = cutlass::gemm::GemmShape<32, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1010,9 +1010,9 @@ TEST(SM50_device_minimum_multiplies_ssrgemm_tt_t, 128x32x8_64x16x1_8x4_8x4_2x2) using WarpShape = cutlass::gemm::GemmShape<64, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1046,9 +1046,9 @@ 
TEST(SM50_device_minimum_multiplies_ssrgemm_tt_t, 128x64x8_64x32x1_8x8_8x4_2x2) using WarpShape = cutlass::gemm::GemmShape<64, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1082,9 +1082,9 @@ TEST(SM50_device_minimum_multiplies_ssrgemm_tt_t, 16x64x16_8x16x1_2x2_4x8_2x4) { using WarpShape = cutlass::gemm::GemmShape<8, 16, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1118,9 +1118,9 @@ TEST(SM50_device_minimum_multiplies_ssrgemm_tt_t, 16x128x16_8x32x1_2x4_4x8_2x4) using WarpShape = cutlass::gemm::GemmShape<8, 32, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1154,9 +1154,9 @@ 
TEST(SM50_device_minimum_multiplies_ssrgemm_tt_t, 32x32x8_16x8x1_2x2_8x4_2x4) { using WarpShape = cutlass::gemm::GemmShape<16, 8, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1190,9 +1190,9 @@ TEST(SM50_device_minimum_multiplies_ssrgemm_tt_t, 32x64x8_16x16x1_4x2_4x8_2x4) { using WarpShape = cutlass::gemm::GemmShape<16, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1226,9 +1226,9 @@ TEST(SM50_device_minimum_multiplies_ssrgemm_tt_t, 32x128x8_16x32x1_4x4_4x8_2x4) using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1262,9 +1262,9 @@ 
TEST(SM50_device_minimum_multiplies_ssrgemm_tt_t, 32x256x8_16x64x1_4x8_4x8_2x4) using WarpShape = cutlass::gemm::GemmShape<16, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1298,9 +1298,9 @@ TEST(SM50_device_minimum_multiplies_ssrgemm_tt_t, 64x64x8_32x16x1_4x4_8x4_2x4) { using WarpShape = cutlass::gemm::GemmShape<32, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1334,9 +1334,9 @@ TEST(SM50_device_minimum_multiplies_ssrgemm_tt_t, 64x128x8_32x32x1_8x4_4x8_2x4) using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1370,9 +1370,9 @@ 
TEST(SM50_device_minimum_multiplies_ssrgemm_tt_t, 64x256x8_32x64x1_8x8_4x8_2x4) using WarpShape = cutlass::gemm::GemmShape<32, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1406,9 +1406,9 @@ TEST(SM50_device_minimum_multiplies_ssrgemm_tt_t, 128x128x8_64x32x1_8x8_8x4_2x4) using WarpShape = cutlass::gemm::GemmShape<64, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1442,9 +1442,9 @@ TEST(SM50_device_minimum_multiplies_ssrgemm_tt_t, 32x32x8_8x16x1_2x2_4x8_4x2) { using WarpShape = cutlass::gemm::GemmShape<8, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1478,9 +1478,9 @@ 
TEST(SM50_device_minimum_multiplies_ssrgemm_tt_t, 64x32x8_16x16x1_4x2_4x8_4x2) { using WarpShape = cutlass::gemm::GemmShape<16, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1514,9 +1514,9 @@ TEST(SM50_device_minimum_multiplies_ssrgemm_tt_t, 64x64x8_16x32x1_4x4_4x8_4x2) { using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1550,9 +1550,9 @@ TEST(SM50_device_minimum_multiplies_ssrgemm_tt_t, 128x32x8_32x16x1_4x4_8x4_4x2) using WarpShape = cutlass::gemm::GemmShape<32, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1586,9 +1586,9 @@ 
TEST(SM50_device_minimum_multiplies_ssrgemm_tt_t, 128x64x8_32x32x1_8x4_4x8_4x2) using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1622,9 +1622,9 @@ TEST(SM50_device_minimum_multiplies_ssrgemm_tt_t, 128x128x8_32x64x1_8x8_4x8_4x2) using WarpShape = cutlass::gemm::GemmShape<32, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1658,9 +1658,9 @@ TEST(SM50_device_minimum_multiplies_ssrgemm_tt_t, 256x32x8_64x16x1_8x4_8x4_4x2) using WarpShape = cutlass::gemm::GemmShape<64, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1694,9 +1694,9 @@ 
TEST(SM50_device_minimum_multiplies_ssrgemm_tt_t, 256x64x8_64x32x1_8x8_8x4_4x2) using WarpShape = cutlass::gemm::GemmShape<64, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1730,9 +1730,9 @@ TEST(SM50_device_minimum_multiplies_ssrgemm_tt_t, 32x64x16_8x16x1_2x2_4x8_4x4) { using WarpShape = cutlass::gemm::GemmShape<8, 16, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1766,9 +1766,9 @@ TEST(SM50_device_minimum_multiplies_ssrgemm_tt_t, 32x128x16_8x32x1_2x4_4x8_4x4) using WarpShape = cutlass::gemm::GemmShape<8, 32, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1802,9 +1802,9 @@ 
TEST(SM50_device_minimum_multiplies_ssrgemm_tt_t, 64x32x16_16x8x1_2x2_8x4_4x4) { using WarpShape = cutlass::gemm::GemmShape<16, 8, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1838,9 +1838,9 @@ TEST(SM50_device_minimum_multiplies_ssrgemm_tt_t, 64x64x8_16x16x1_4x2_4x8_4x4) { using WarpShape = cutlass::gemm::GemmShape<16, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1874,9 +1874,9 @@ TEST(SM50_device_minimum_multiplies_ssrgemm_tt_t, 64x128x8_16x32x1_4x4_4x8_4x4) using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1910,9 +1910,9 @@ 
TEST(SM50_device_minimum_multiplies_ssrgemm_tt_t, 64x256x8_16x64x1_4x8_4x8_4x4) using WarpShape = cutlass::gemm::GemmShape<16, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1946,9 +1946,9 @@ TEST(SM50_device_minimum_multiplies_ssrgemm_tt_t, 128x32x16_32x8x1_4x2_8x4_4x4) using WarpShape = cutlass::gemm::GemmShape<32, 8, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1982,9 +1982,9 @@ TEST(SM50_device_minimum_multiplies_ssrgemm_tt_t, 128x64x8_32x16x1_4x4_8x4_4x4) using WarpShape = cutlass::gemm::GemmShape<32, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -2018,9 +2018,9 @@ 
TEST(SM50_device_minimum_multiplies_ssrgemm_tt_t, 128x128x8_32x32x1_8x4_4x8_4x4) using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -2054,9 +2054,9 @@ TEST(SM50_device_minimum_multiplies_ssrgemm_tt_t, 256x64x8_64x16x1_8x4_8x4_4x4) using WarpShape = cutlass::gemm::GemmShape<64, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; diff --git a/test/device/sm50_simt_minimum_plus_dsrgemm_nn_n.cu b/test/device/sm50_simt_minimum_plus_dsrgemm_nn_n.cu index 14b5dea..a485b57 100644 --- a/test/device/sm50_simt_minimum_plus_dsrgemm_nn_n.cu +++ b/test/device/sm50_simt_minimum_plus_dsrgemm_nn_n.cu @@ -38,9 +38,9 @@ TEST(SM50_device_minimum_plus_dsrgemm_nn_n, 8x32x8_8x32x1_2x4_4x8_1x1) { using WarpShape = cutlass::gemm::GemmShape<8, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename 
cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -74,9 +74,9 @@ TEST(SM50_device_minimum_plus_dsrgemm_nn_n, 16x32x8_16x32x1_4x4_4x8_1x1) { using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -110,9 +110,9 @@ TEST(SM50_device_minimum_plus_dsrgemm_nn_n, 16x64x8_16x64x1_4x8_4x8_1x1) { using WarpShape = cutlass::gemm::GemmShape<16, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -146,9 +146,9 @@ TEST(SM50_device_minimum_plus_dsrgemm_nn_n, 32x32x8_32x32x1_8x4_4x8_1x1) { using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, 
+ cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -182,9 +182,9 @@ TEST(SM50_device_minimum_plus_dsrgemm_nn_n, 8x32x8_8x16x1_2x2_4x8_1x2) { using WarpShape = cutlass::gemm::GemmShape<8, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -218,9 +218,9 @@ TEST(SM50_device_minimum_plus_dsrgemm_nn_n, 8x64x8_8x32x1_2x4_4x8_1x2) { using WarpShape = cutlass::gemm::GemmShape<8, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -254,9 +254,9 @@ TEST(SM50_device_minimum_plus_dsrgemm_nn_n, 16x32x8_16x16x1_4x2_4x8_1x2) { using WarpShape = cutlass::gemm::GemmShape<16, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = 
Config::MultiplicationOp; @@ -290,9 +290,9 @@ TEST(SM50_device_minimum_plus_dsrgemm_nn_n, 16x64x8_16x32x1_4x4_4x8_1x2) { using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -326,9 +326,9 @@ TEST(SM50_device_minimum_plus_dsrgemm_nn_n, 16x128x8_16x64x1_4x8_4x8_1x2) { using WarpShape = cutlass::gemm::GemmShape<16, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -362,9 +362,9 @@ TEST(SM50_device_minimum_plus_dsrgemm_nn_n, 32x32x8_32x16x1_4x4_8x4_1x2) { using WarpShape = cutlass::gemm::GemmShape<32, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -398,9 +398,9 @@ TEST(SM50_device_minimum_plus_dsrgemm_nn_n, 
32x64x8_32x32x1_8x4_4x8_1x2) { using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -434,9 +434,9 @@ TEST(SM50_device_minimum_plus_dsrgemm_nn_n, 32x32x8_16x32x1_4x4_4x8_2x1) { using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -470,9 +470,9 @@ TEST(SM50_device_minimum_plus_dsrgemm_nn_n, 64x32x8_32x32x1_8x4_4x8_2x1) { using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -506,9 +506,9 @@ TEST(SM50_device_minimum_plus_dsrgemm_nn_n, 16x32x8_8x16x1_2x2_4x8_2x2) { using WarpShape = cutlass::gemm::GemmShape<8, 16, 8>; using 
InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -542,9 +542,9 @@ TEST(SM50_device_minimum_plus_dsrgemm_nn_n, 16x64x8_8x32x1_2x4_4x8_2x2) { using WarpShape = cutlass::gemm::GemmShape<8, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -578,9 +578,9 @@ TEST(SM50_device_minimum_plus_dsrgemm_nn_n, 32x32x8_16x16x1_4x2_4x8_2x2) { using WarpShape = cutlass::gemm::GemmShape<16, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -614,9 +614,9 @@ TEST(SM50_device_minimum_plus_dsrgemm_nn_n, 32x64x8_16x32x1_4x4_4x8_2x2) { using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename 
cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -650,9 +650,9 @@ TEST(SM50_device_minimum_plus_dsrgemm_nn_n, 32x128x8_16x64x1_4x8_4x8_2x2) { using WarpShape = cutlass::gemm::GemmShape<16, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -686,9 +686,9 @@ TEST(SM50_device_minimum_plus_dsrgemm_nn_n, 64x32x8_32x16x1_4x4_8x4_2x2) { using WarpShape = cutlass::gemm::GemmShape<32, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -722,9 +722,9 @@ TEST(SM50_device_minimum_plus_dsrgemm_nn_n, 64x64x8_32x32x1_8x4_4x8_2x2) { using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, 
precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -758,9 +758,9 @@ TEST(SM50_device_minimum_plus_dsrgemm_nn_n, 128x32x8_64x16x1_8x4_8x4_2x2) { using WarpShape = cutlass::gemm::GemmShape<64, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -794,9 +794,9 @@ TEST(SM50_device_minimum_plus_dsrgemm_nn_n, 16x64x16_8x16x1_2x2_4x8_2x4) { using WarpShape = cutlass::gemm::GemmShape<8, 16, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -830,9 +830,9 @@ TEST(SM50_device_minimum_plus_dsrgemm_nn_n, 16x128x16_8x32x1_2x4_4x8_2x4) { using WarpShape = cutlass::gemm::GemmShape<8, 32, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename 
cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -866,9 +866,9 @@ TEST(SM50_device_minimum_plus_dsrgemm_nn_n, 32x32x8_16x8x1_2x2_8x4_2x4) { using WarpShape = cutlass::gemm::GemmShape<16, 8, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -902,9 +902,9 @@ TEST(SM50_device_minimum_plus_dsrgemm_nn_n, 32x64x8_16x16x1_4x2_4x8_2x4) { using WarpShape = cutlass::gemm::GemmShape<16, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -938,9 +938,9 @@ TEST(SM50_device_minimum_plus_dsrgemm_nn_n, 32x128x8_16x32x1_4x4_4x8_2x4) { using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, 
precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -974,9 +974,9 @@ TEST(SM50_device_minimum_plus_dsrgemm_nn_n, 64x64x8_32x16x1_4x4_8x4_2x4) { using WarpShape = cutlass::gemm::GemmShape<32, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1010,9 +1010,9 @@ TEST(SM50_device_minimum_plus_dsrgemm_nn_n, 32x32x8_8x16x1_2x2_4x8_4x2) { using WarpShape = cutlass::gemm::GemmShape<8, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1046,9 +1046,9 @@ TEST(SM50_device_minimum_plus_dsrgemm_nn_n, 64x32x8_16x16x1_4x2_4x8_4x2) { using WarpShape = cutlass::gemm::GemmShape<16, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = 
Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1082,9 +1082,9 @@ TEST(SM50_device_minimum_plus_dsrgemm_nn_n, 64x64x8_16x32x1_4x4_4x8_4x2) { using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1118,9 +1118,9 @@ TEST(SM50_device_minimum_plus_dsrgemm_nn_n, 128x32x8_32x16x1_4x4_8x4_4x2) { using WarpShape = cutlass::gemm::GemmShape<32, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1154,9 +1154,9 @@ TEST(SM50_device_minimum_plus_dsrgemm_nn_n, 32x64x16_8x16x1_2x2_4x8_4x4) { using WarpShape = cutlass::gemm::GemmShape<8, 16, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1190,9 +1190,9 @@ 
TEST(SM50_device_minimum_plus_dsrgemm_nn_n, 32x128x16_8x32x1_2x4_4x8_4x4) { using WarpShape = cutlass::gemm::GemmShape<8, 32, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1226,9 +1226,9 @@ TEST(SM50_device_minimum_plus_dsrgemm_nn_n, 64x32x16_16x8x1_2x2_8x4_4x4) { using WarpShape = cutlass::gemm::GemmShape<16, 8, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1262,9 +1262,9 @@ TEST(SM50_device_minimum_plus_dsrgemm_nn_n, 64x64x8_16x16x1_4x2_4x8_4x4) { using WarpShape = cutlass::gemm::GemmShape<16, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1298,9 +1298,9 @@ TEST(SM50_device_minimum_plus_dsrgemm_nn_n, 128x32x16_32x8x1_4x2_8x4_4x4) { using 
WarpShape = cutlass::gemm::GemmShape<32, 8, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; diff --git a/test/device/sm50_simt_minimum_plus_dsrgemm_nn_t.cu b/test/device/sm50_simt_minimum_plus_dsrgemm_nn_t.cu index d2f5b82..41a84d5 100644 --- a/test/device/sm50_simt_minimum_plus_dsrgemm_nn_t.cu +++ b/test/device/sm50_simt_minimum_plus_dsrgemm_nn_t.cu @@ -38,9 +38,9 @@ TEST(SM50_device_minimum_plus_dsrgemm_nn_t, 8x32x8_8x32x1_2x4_4x8_1x1) { using WarpShape = cutlass::gemm::GemmShape<8, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -74,9 +74,9 @@ TEST(SM50_device_minimum_plus_dsrgemm_nn_t, 16x32x8_16x32x1_4x4_4x8_1x1) { using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = 
Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -110,9 +110,9 @@ TEST(SM50_device_minimum_plus_dsrgemm_nn_t, 16x64x8_16x64x1_4x8_4x8_1x1) { using WarpShape = cutlass::gemm::GemmShape<16, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -146,9 +146,9 @@ TEST(SM50_device_minimum_plus_dsrgemm_nn_t, 32x32x8_32x32x1_8x4_4x8_1x1) { using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -182,9 +182,9 @@ TEST(SM50_device_minimum_plus_dsrgemm_nn_t, 8x32x8_8x16x1_2x2_4x8_1x2) { using WarpShape = cutlass::gemm::GemmShape<8, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -218,9 +218,9 @@ 
TEST(SM50_device_minimum_plus_dsrgemm_nn_t, 8x64x8_8x32x1_2x4_4x8_1x2) { using WarpShape = cutlass::gemm::GemmShape<8, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -254,9 +254,9 @@ TEST(SM50_device_minimum_plus_dsrgemm_nn_t, 16x32x8_16x16x1_4x2_4x8_1x2) { using WarpShape = cutlass::gemm::GemmShape<16, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -290,9 +290,9 @@ TEST(SM50_device_minimum_plus_dsrgemm_nn_t, 16x64x8_16x32x1_4x4_4x8_1x2) { using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -326,9 +326,9 @@ TEST(SM50_device_minimum_plus_dsrgemm_nn_t, 16x128x8_16x64x1_4x8_4x8_1x2) { using WarpShape = 
cutlass::gemm::GemmShape<16, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -362,9 +362,9 @@ TEST(SM50_device_minimum_plus_dsrgemm_nn_t, 32x32x8_32x16x1_4x4_8x4_1x2) { using WarpShape = cutlass::gemm::GemmShape<32, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -398,9 +398,9 @@ TEST(SM50_device_minimum_plus_dsrgemm_nn_t, 32x64x8_32x32x1_8x4_4x8_1x2) { using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -434,9 +434,9 @@ TEST(SM50_device_minimum_plus_dsrgemm_nn_t, 32x32x8_16x32x1_4x4_4x8_2x1) { using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 
1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -470,9 +470,9 @@ TEST(SM50_device_minimum_plus_dsrgemm_nn_t, 64x32x8_32x32x1_8x4_4x8_2x1) { using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -506,9 +506,9 @@ TEST(SM50_device_minimum_plus_dsrgemm_nn_t, 16x32x8_8x16x1_2x2_4x8_2x2) { using WarpShape = cutlass::gemm::GemmShape<8, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -542,9 +542,9 @@ TEST(SM50_device_minimum_plus_dsrgemm_nn_t, 16x64x8_8x32x1_2x4_4x8_2x2) { using WarpShape = cutlass::gemm::GemmShape<8, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, 
precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -578,9 +578,9 @@ TEST(SM50_device_minimum_plus_dsrgemm_nn_t, 32x32x8_16x16x1_4x2_4x8_2x2) { using WarpShape = cutlass::gemm::GemmShape<16, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -614,9 +614,9 @@ TEST(SM50_device_minimum_plus_dsrgemm_nn_t, 32x64x8_16x32x1_4x4_4x8_2x2) { using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -650,9 +650,9 @@ TEST(SM50_device_minimum_plus_dsrgemm_nn_t, 32x128x8_16x64x1_4x8_4x8_2x2) { using WarpShape = cutlass::gemm::GemmShape<16, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using 
Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -686,9 +686,9 @@ TEST(SM50_device_minimum_plus_dsrgemm_nn_t, 64x32x8_32x16x1_4x4_8x4_2x2) { using WarpShape = cutlass::gemm::GemmShape<32, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -722,9 +722,9 @@ TEST(SM50_device_minimum_plus_dsrgemm_nn_t, 64x64x8_32x32x1_8x4_4x8_2x2) { using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -758,9 +758,9 @@ TEST(SM50_device_minimum_plus_dsrgemm_nn_t, 128x32x8_64x16x1_8x4_8x4_2x2) { using WarpShape = cutlass::gemm::GemmShape<64, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, 
precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -794,9 +794,9 @@ TEST(SM50_device_minimum_plus_dsrgemm_nn_t, 16x64x16_8x16x1_2x2_4x8_2x4) { using WarpShape = cutlass::gemm::GemmShape<8, 16, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -830,9 +830,9 @@ TEST(SM50_device_minimum_plus_dsrgemm_nn_t, 16x128x16_8x32x1_2x4_4x8_2x4) { using WarpShape = cutlass::gemm::GemmShape<8, 32, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -866,9 +866,9 @@ TEST(SM50_device_minimum_plus_dsrgemm_nn_t, 32x32x8_16x8x1_2x2_8x4_2x4) { using WarpShape = cutlass::gemm::GemmShape<16, 8, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = 
Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -902,9 +902,9 @@ TEST(SM50_device_minimum_plus_dsrgemm_nn_t, 32x64x8_16x16x1_4x2_4x8_2x4) { using WarpShape = cutlass::gemm::GemmShape<16, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -938,9 +938,9 @@ TEST(SM50_device_minimum_plus_dsrgemm_nn_t, 32x128x8_16x32x1_4x4_4x8_2x4) { using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -974,9 +974,9 @@ TEST(SM50_device_minimum_plus_dsrgemm_nn_t, 64x64x8_32x16x1_4x4_8x4_2x4) { using WarpShape = cutlass::gemm::GemmShape<32, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1010,9 +1010,9 @@ 
TEST(SM50_device_minimum_plus_dsrgemm_nn_t, 32x32x8_8x16x1_2x2_4x8_4x2) { using WarpShape = cutlass::gemm::GemmShape<8, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1046,9 +1046,9 @@ TEST(SM50_device_minimum_plus_dsrgemm_nn_t, 64x32x8_16x16x1_4x2_4x8_4x2) { using WarpShape = cutlass::gemm::GemmShape<16, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1082,9 +1082,9 @@ TEST(SM50_device_minimum_plus_dsrgemm_nn_t, 64x64x8_16x32x1_4x4_4x8_4x2) { using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1118,9 +1118,9 @@ TEST(SM50_device_minimum_plus_dsrgemm_nn_t, 128x32x8_32x16x1_4x4_8x4_4x2) { using 
WarpShape = cutlass::gemm::GemmShape<32, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1154,9 +1154,9 @@ TEST(SM50_device_minimum_plus_dsrgemm_nn_t, 32x64x16_8x16x1_2x2_4x8_4x4) { using WarpShape = cutlass::gemm::GemmShape<8, 16, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1190,9 +1190,9 @@ TEST(SM50_device_minimum_plus_dsrgemm_nn_t, 32x128x16_8x32x1_2x4_4x8_4x4) { using WarpShape = cutlass::gemm::GemmShape<8, 32, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1226,9 +1226,9 @@ TEST(SM50_device_minimum_plus_dsrgemm_nn_t, 64x32x16_16x8x1_2x2_8x4_4x4) { using WarpShape = cutlass::gemm::GemmShape<16, 8, 16>; using InstructionShape = 
cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1262,9 +1262,9 @@ TEST(SM50_device_minimum_plus_dsrgemm_nn_t, 64x64x8_16x16x1_4x2_4x8_4x4) { using WarpShape = cutlass::gemm::GemmShape<16, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1298,9 +1298,9 @@ TEST(SM50_device_minimum_plus_dsrgemm_nn_t, 128x32x16_32x8x1_4x2_8x4_4x4) { using WarpShape = cutlass::gemm::GemmShape<32, 8, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; diff --git a/test/device/sm50_simt_minimum_plus_dsrgemm_nt_n.cu b/test/device/sm50_simt_minimum_plus_dsrgemm_nt_n.cu index 8263aae..f4efc00 100644 --- a/test/device/sm50_simt_minimum_plus_dsrgemm_nt_n.cu +++ b/test/device/sm50_simt_minimum_plus_dsrgemm_nt_n.cu @@ 
-38,9 +38,9 @@ TEST(SM50_device_minimum_plus_dsrgemm_nt_n, 8x32x8_8x32x1_2x4_4x8_1x1) { using WarpShape = cutlass::gemm::GemmShape<8, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -74,9 +74,9 @@ TEST(SM50_device_minimum_plus_dsrgemm_nt_n, 16x32x8_16x32x1_4x4_4x8_1x1) { using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -110,9 +110,9 @@ TEST(SM50_device_minimum_plus_dsrgemm_nt_n, 16x64x8_16x64x1_4x8_4x8_1x1) { using WarpShape = cutlass::gemm::GemmShape<16, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -146,9 +146,9 @@ TEST(SM50_device_minimum_plus_dsrgemm_nt_n, 32x32x8_32x32x1_8x4_4x8_1x1) { using 
WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -182,9 +182,9 @@ TEST(SM50_device_minimum_plus_dsrgemm_nt_n, 8x32x8_8x16x1_2x2_4x8_1x2) { using WarpShape = cutlass::gemm::GemmShape<8, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -218,9 +218,9 @@ TEST(SM50_device_minimum_plus_dsrgemm_nt_n, 8x64x8_8x32x1_2x4_4x8_1x2) { using WarpShape = cutlass::gemm::GemmShape<8, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -254,9 +254,9 @@ TEST(SM50_device_minimum_plus_dsrgemm_nt_n, 16x32x8_16x16x1_4x2_4x8_1x2) { using WarpShape = cutlass::gemm::GemmShape<16, 16, 8>; using InstructionShape = 
cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -290,9 +290,9 @@ TEST(SM50_device_minimum_plus_dsrgemm_nt_n, 16x64x8_16x32x1_4x4_4x8_1x2) { using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -326,9 +326,9 @@ TEST(SM50_device_minimum_plus_dsrgemm_nt_n, 16x128x8_16x64x1_4x8_4x8_1x2) { using WarpShape = cutlass::gemm::GemmShape<16, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -362,9 +362,9 @@ TEST(SM50_device_minimum_plus_dsrgemm_nt_n, 32x32x8_32x16x1_4x4_8x4_1x2) { using WarpShape = cutlass::gemm::GemmShape<32, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename 
cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -398,9 +398,9 @@ TEST(SM50_device_minimum_plus_dsrgemm_nt_n, 32x64x8_32x32x1_8x4_4x8_1x2) { using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -434,9 +434,9 @@ TEST(SM50_device_minimum_plus_dsrgemm_nt_n, 32x32x8_16x32x1_4x4_4x8_2x1) { using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -470,9 +470,9 @@ TEST(SM50_device_minimum_plus_dsrgemm_nt_n, 64x32x8_32x32x1_8x4_4x8_2x1) { using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, 
precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -506,9 +506,9 @@ TEST(SM50_device_minimum_plus_dsrgemm_nt_n, 16x32x8_8x16x1_2x2_4x8_2x2) { using WarpShape = cutlass::gemm::GemmShape<8, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -542,9 +542,9 @@ TEST(SM50_device_minimum_plus_dsrgemm_nt_n, 16x64x8_8x32x1_2x4_4x8_2x2) { using WarpShape = cutlass::gemm::GemmShape<8, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -578,9 +578,9 @@ TEST(SM50_device_minimum_plus_dsrgemm_nt_n, 32x32x8_16x16x1_4x2_4x8_2x2) { using WarpShape = cutlass::gemm::GemmShape<16, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename 
cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -614,9 +614,9 @@ TEST(SM50_device_minimum_plus_dsrgemm_nt_n, 32x64x8_16x32x1_4x4_4x8_2x2) { using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -650,9 +650,9 @@ TEST(SM50_device_minimum_plus_dsrgemm_nt_n, 32x128x8_16x64x1_4x8_4x8_2x2) { using WarpShape = cutlass::gemm::GemmShape<16, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -686,9 +686,9 @@ TEST(SM50_device_minimum_plus_dsrgemm_nt_n, 64x32x8_32x16x1_4x4_8x4_2x2) { using WarpShape = cutlass::gemm::GemmShape<32, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, 
precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -722,9 +722,9 @@ TEST(SM50_device_minimum_plus_dsrgemm_nt_n, 64x64x8_32x32x1_8x4_4x8_2x2) { using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -758,9 +758,9 @@ TEST(SM50_device_minimum_plus_dsrgemm_nt_n, 128x32x8_64x16x1_8x4_8x4_2x2) { using WarpShape = cutlass::gemm::GemmShape<64, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -794,9 +794,9 @@ TEST(SM50_device_minimum_plus_dsrgemm_nt_n, 16x64x16_8x16x1_2x2_4x8_2x4) { using WarpShape = cutlass::gemm::GemmShape<8, 16, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; 
using MultOp = Config::MultiplicationOp; @@ -830,9 +830,9 @@ TEST(SM50_device_minimum_plus_dsrgemm_nt_n, 16x128x16_8x32x1_2x4_4x8_2x4) { using WarpShape = cutlass::gemm::GemmShape<8, 32, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -866,9 +866,9 @@ TEST(SM50_device_minimum_plus_dsrgemm_nt_n, 32x32x8_16x8x1_2x2_8x4_2x4) { using WarpShape = cutlass::gemm::GemmShape<16, 8, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -902,9 +902,9 @@ TEST(SM50_device_minimum_plus_dsrgemm_nt_n, 32x64x8_16x16x1_4x2_4x8_2x4) { using WarpShape = cutlass::gemm::GemmShape<16, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -938,9 +938,9 @@ 
TEST(SM50_device_minimum_plus_dsrgemm_nt_n, 32x128x8_16x32x1_4x4_4x8_2x4) { using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -974,9 +974,9 @@ TEST(SM50_device_minimum_plus_dsrgemm_nt_n, 64x64x8_32x16x1_4x4_8x4_2x4) { using WarpShape = cutlass::gemm::GemmShape<32, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1010,9 +1010,9 @@ TEST(SM50_device_minimum_plus_dsrgemm_nt_n, 32x32x8_8x16x1_2x2_4x8_4x2) { using WarpShape = cutlass::gemm::GemmShape<8, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1046,9 +1046,9 @@ TEST(SM50_device_minimum_plus_dsrgemm_nt_n, 64x32x8_16x16x1_4x2_4x8_4x2) { using WarpShape 
= cutlass::gemm::GemmShape<16, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1082,9 +1082,9 @@ TEST(SM50_device_minimum_plus_dsrgemm_nt_n, 64x64x8_16x32x1_4x4_4x8_4x2) { using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1118,9 +1118,9 @@ TEST(SM50_device_minimum_plus_dsrgemm_nt_n, 128x32x8_32x16x1_4x4_8x4_4x2) { using WarpShape = cutlass::gemm::GemmShape<32, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1154,9 +1154,9 @@ TEST(SM50_device_minimum_plus_dsrgemm_nt_n, 32x64x16_8x16x1_2x2_4x8_4x4) { using WarpShape = cutlass::gemm::GemmShape<8, 16, 16>; using InstructionShape = 
cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1190,9 +1190,9 @@ TEST(SM50_device_minimum_plus_dsrgemm_nt_n, 32x128x16_8x32x1_2x4_4x8_4x4) { using WarpShape = cutlass::gemm::GemmShape<8, 32, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1226,9 +1226,9 @@ TEST(SM50_device_minimum_plus_dsrgemm_nt_n, 64x32x16_16x8x1_2x2_8x4_4x4) { using WarpShape = cutlass::gemm::GemmShape<16, 8, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1262,9 +1262,9 @@ TEST(SM50_device_minimum_plus_dsrgemm_nt_n, 64x64x8_16x16x1_4x2_4x8_4x4) { using WarpShape = cutlass::gemm::GemmShape<16, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename 
cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1298,9 +1298,9 @@ TEST(SM50_device_minimum_plus_dsrgemm_nt_n, 128x32x16_32x8x1_4x2_8x4_4x4) { using WarpShape = cutlass::gemm::GemmShape<32, 8, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; diff --git a/test/device/sm50_simt_minimum_plus_dsrgemm_nt_t.cu b/test/device/sm50_simt_minimum_plus_dsrgemm_nt_t.cu index cdb73a4..0fead9b 100644 --- a/test/device/sm50_simt_minimum_plus_dsrgemm_nt_t.cu +++ b/test/device/sm50_simt_minimum_plus_dsrgemm_nt_t.cu @@ -38,9 +38,9 @@ TEST(SM50_device_minimum_plus_dsrgemm_nt_t, 8x32x8_8x32x1_2x4_4x8_1x1) { using WarpShape = cutlass::gemm::GemmShape<8, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -74,9 +74,9 @@ TEST(SM50_device_minimum_plus_dsrgemm_nt_t, 
16x32x8_16x32x1_4x4_4x8_1x1) { using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -110,9 +110,9 @@ TEST(SM50_device_minimum_plus_dsrgemm_nt_t, 16x64x8_16x64x1_4x8_4x8_1x1) { using WarpShape = cutlass::gemm::GemmShape<16, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -146,9 +146,9 @@ TEST(SM50_device_minimum_plus_dsrgemm_nt_t, 32x32x8_32x32x1_8x4_4x8_1x1) { using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -182,9 +182,9 @@ TEST(SM50_device_minimum_plus_dsrgemm_nt_t, 8x32x8_8x16x1_2x2_4x8_1x2) { using WarpShape = cutlass::gemm::GemmShape<8, 16, 8>; using 
InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -218,9 +218,9 @@ TEST(SM50_device_minimum_plus_dsrgemm_nt_t, 8x64x8_8x32x1_2x4_4x8_1x2) { using WarpShape = cutlass::gemm::GemmShape<8, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -254,9 +254,9 @@ TEST(SM50_device_minimum_plus_dsrgemm_nt_t, 16x32x8_16x16x1_4x2_4x8_1x2) { using WarpShape = cutlass::gemm::GemmShape<16, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -290,9 +290,9 @@ TEST(SM50_device_minimum_plus_dsrgemm_nt_t, 16x64x8_16x32x1_4x4_4x8_1x2) { using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename 
cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -326,9 +326,9 @@ TEST(SM50_device_minimum_plus_dsrgemm_nt_t, 16x128x8_16x64x1_4x8_4x8_1x2) { using WarpShape = cutlass::gemm::GemmShape<16, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -362,9 +362,9 @@ TEST(SM50_device_minimum_plus_dsrgemm_nt_t, 32x32x8_32x16x1_4x4_8x4_1x2) { using WarpShape = cutlass::gemm::GemmShape<32, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -398,9 +398,9 @@ TEST(SM50_device_minimum_plus_dsrgemm_nt_t, 32x64x8_32x32x1_8x4_4x8_1x2) { using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, 
precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -434,9 +434,9 @@ TEST(SM50_device_minimum_plus_dsrgemm_nt_t, 32x32x8_16x32x1_4x4_4x8_2x1) { using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -470,9 +470,9 @@ TEST(SM50_device_minimum_plus_dsrgemm_nt_t, 64x32x8_32x32x1_8x4_4x8_2x1) { using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -506,9 +506,9 @@ TEST(SM50_device_minimum_plus_dsrgemm_nt_t, 16x32x8_8x16x1_2x2_4x8_2x2) { using WarpShape = cutlass::gemm::GemmShape<8, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename 
cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -542,9 +542,9 @@ TEST(SM50_device_minimum_plus_dsrgemm_nt_t, 16x64x8_8x32x1_2x4_4x8_2x2) { using WarpShape = cutlass::gemm::GemmShape<8, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -578,9 +578,9 @@ TEST(SM50_device_minimum_plus_dsrgemm_nt_t, 32x32x8_16x16x1_4x2_4x8_2x2) { using WarpShape = cutlass::gemm::GemmShape<16, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -614,9 +614,9 @@ TEST(SM50_device_minimum_plus_dsrgemm_nt_t, 32x64x8_16x32x1_4x4_4x8_2x2) { using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, 
+ cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -650,9 +650,9 @@ TEST(SM50_device_minimum_plus_dsrgemm_nt_t, 32x128x8_16x64x1_4x8_4x8_2x2) { using WarpShape = cutlass::gemm::GemmShape<16, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -686,9 +686,9 @@ TEST(SM50_device_minimum_plus_dsrgemm_nt_t, 64x32x8_32x16x1_4x4_8x4_2x2) { using WarpShape = cutlass::gemm::GemmShape<32, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -722,9 +722,9 @@ TEST(SM50_device_minimum_plus_dsrgemm_nt_t, 64x64x8_32x32x1_8x4_4x8_2x2) { using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using 
MultOp = Config::MultiplicationOp; @@ -758,9 +758,9 @@ TEST(SM50_device_minimum_plus_dsrgemm_nt_t, 128x32x8_64x16x1_8x4_8x4_2x2) { using WarpShape = cutlass::gemm::GemmShape<64, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -794,9 +794,9 @@ TEST(SM50_device_minimum_plus_dsrgemm_nt_t, 16x64x16_8x16x1_2x2_4x8_2x4) { using WarpShape = cutlass::gemm::GemmShape<8, 16, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -830,9 +830,9 @@ TEST(SM50_device_minimum_plus_dsrgemm_nt_t, 16x128x16_8x32x1_2x4_4x8_2x4) { using WarpShape = cutlass::gemm::GemmShape<8, 32, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -866,9 +866,9 @@ 
TEST(SM50_device_minimum_plus_dsrgemm_nt_t, 32x32x8_16x8x1_2x2_8x4_2x4) { using WarpShape = cutlass::gemm::GemmShape<16, 8, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -902,9 +902,9 @@ TEST(SM50_device_minimum_plus_dsrgemm_nt_t, 32x64x8_16x16x1_4x2_4x8_2x4) { using WarpShape = cutlass::gemm::GemmShape<16, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -938,9 +938,9 @@ TEST(SM50_device_minimum_plus_dsrgemm_nt_t, 32x128x8_16x32x1_4x4_4x8_2x4) { using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -974,9 +974,9 @@ TEST(SM50_device_minimum_plus_dsrgemm_nt_t, 64x64x8_32x16x1_4x4_8x4_2x4) { using WarpShape = 
cutlass::gemm::GemmShape<32, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1010,9 +1010,9 @@ TEST(SM50_device_minimum_plus_dsrgemm_nt_t, 32x32x8_8x16x1_2x2_4x8_4x2) { using WarpShape = cutlass::gemm::GemmShape<8, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1046,9 +1046,9 @@ TEST(SM50_device_minimum_plus_dsrgemm_nt_t, 64x32x8_16x16x1_4x2_4x8_4x2) { using WarpShape = cutlass::gemm::GemmShape<16, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1082,9 +1082,9 @@ TEST(SM50_device_minimum_plus_dsrgemm_nt_t, 64x64x8_16x32x1_4x4_4x8_4x2) { using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 
1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1118,9 +1118,9 @@ TEST(SM50_device_minimum_plus_dsrgemm_nt_t, 128x32x8_32x16x1_4x4_8x4_4x2) { using WarpShape = cutlass::gemm::GemmShape<32, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1154,9 +1154,9 @@ TEST(SM50_device_minimum_plus_dsrgemm_nt_t, 32x64x16_8x16x1_2x2_4x8_4x4) { using WarpShape = cutlass::gemm::GemmShape<8, 16, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1190,9 +1190,9 @@ TEST(SM50_device_minimum_plus_dsrgemm_nt_t, 32x128x16_8x32x1_2x4_4x8_4x4) { using WarpShape = cutlass::gemm::GemmShape<8, 32, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // 
- precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1226,9 +1226,9 @@ TEST(SM50_device_minimum_plus_dsrgemm_nt_t, 64x32x16_16x8x1_2x2_8x4_4x4) { using WarpShape = cutlass::gemm::GemmShape<16, 8, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1262,9 +1262,9 @@ TEST(SM50_device_minimum_plus_dsrgemm_nt_t, 64x64x8_16x16x1_4x2_4x8_4x4) { using WarpShape = cutlass::gemm::GemmShape<16, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1298,9 +1298,9 @@ TEST(SM50_device_minimum_plus_dsrgemm_nt_t, 128x32x16_32x8x1_4x2_8x4_4x4) { using WarpShape = cutlass::gemm::GemmShape<32, 8, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, 
cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; diff --git a/test/device/sm50_simt_minimum_plus_dsrgemm_tn_n.cu b/test/device/sm50_simt_minimum_plus_dsrgemm_tn_n.cu index ead0b99..b476caa 100644 --- a/test/device/sm50_simt_minimum_plus_dsrgemm_tn_n.cu +++ b/test/device/sm50_simt_minimum_plus_dsrgemm_tn_n.cu @@ -38,9 +38,9 @@ TEST(SM50_device_minimum_plus_dsrgemm_tn_n, 8x32x8_8x32x1_2x4_4x8_1x1) { using WarpShape = cutlass::gemm::GemmShape<8, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -74,9 +74,9 @@ TEST(SM50_device_minimum_plus_dsrgemm_tn_n, 16x32x8_16x32x1_4x4_4x8_1x1) { using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -110,9 +110,9 @@ TEST(SM50_device_minimum_plus_dsrgemm_tn_n, 16x64x8_16x64x1_4x8_4x8_1x1) { using WarpShape = cutlass::gemm::GemmShape<16, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 
1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -146,9 +146,9 @@ TEST(SM50_device_minimum_plus_dsrgemm_tn_n, 32x32x8_32x32x1_8x4_4x8_1x1) { using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -182,9 +182,9 @@ TEST(SM50_device_minimum_plus_dsrgemm_tn_n, 8x32x8_8x16x1_2x2_4x8_1x2) { using WarpShape = cutlass::gemm::GemmShape<8, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -218,9 +218,9 @@ TEST(SM50_device_minimum_plus_dsrgemm_tn_n, 8x64x8_8x32x1_2x4_4x8_1x2) { using WarpShape = cutlass::gemm::GemmShape<8, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, 
precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -254,9 +254,9 @@ TEST(SM50_device_minimum_plus_dsrgemm_tn_n, 16x32x8_16x16x1_4x2_4x8_1x2) { using WarpShape = cutlass::gemm::GemmShape<16, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -290,9 +290,9 @@ TEST(SM50_device_minimum_plus_dsrgemm_tn_n, 16x64x8_16x32x1_4x4_4x8_1x2) { using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -326,9 +326,9 @@ TEST(SM50_device_minimum_plus_dsrgemm_tn_n, 16x128x8_16x64x1_4x8_4x8_1x2) { using WarpShape = cutlass::gemm::GemmShape<16, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using 
Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -362,9 +362,9 @@ TEST(SM50_device_minimum_plus_dsrgemm_tn_n, 32x32x8_32x16x1_4x4_8x4_1x2) { using WarpShape = cutlass::gemm::GemmShape<32, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -398,9 +398,9 @@ TEST(SM50_device_minimum_plus_dsrgemm_tn_n, 32x64x8_32x32x1_8x4_4x8_1x2) { using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -434,9 +434,9 @@ TEST(SM50_device_minimum_plus_dsrgemm_tn_n, 32x32x8_16x32x1_4x4_4x8_2x1) { using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, 
precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -470,9 +470,9 @@ TEST(SM50_device_minimum_plus_dsrgemm_tn_n, 64x32x8_32x32x1_8x4_4x8_2x1) { using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -506,9 +506,9 @@ TEST(SM50_device_minimum_plus_dsrgemm_tn_n, 16x32x8_8x16x1_2x2_4x8_2x2) { using WarpShape = cutlass::gemm::GemmShape<8, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -542,9 +542,9 @@ TEST(SM50_device_minimum_plus_dsrgemm_tn_n, 16x64x8_8x32x1_2x4_4x8_2x2) { using WarpShape = cutlass::gemm::GemmShape<8, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = 
Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -578,9 +578,9 @@ TEST(SM50_device_minimum_plus_dsrgemm_tn_n, 32x32x8_16x16x1_4x2_4x8_2x2) { using WarpShape = cutlass::gemm::GemmShape<16, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -614,9 +614,9 @@ TEST(SM50_device_minimum_plus_dsrgemm_tn_n, 32x64x8_16x32x1_4x4_4x8_2x2) { using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -650,9 +650,9 @@ TEST(SM50_device_minimum_plus_dsrgemm_tn_n, 32x128x8_16x64x1_4x8_4x8_2x2) { using WarpShape = cutlass::gemm::GemmShape<16, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -686,9 +686,9 @@ 
TEST(SM50_device_minimum_plus_dsrgemm_tn_n, 64x32x8_32x16x1_4x4_8x4_2x2) { using WarpShape = cutlass::gemm::GemmShape<32, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -722,9 +722,9 @@ TEST(SM50_device_minimum_plus_dsrgemm_tn_n, 64x64x8_32x32x1_8x4_4x8_2x2) { using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -758,9 +758,9 @@ TEST(SM50_device_minimum_plus_dsrgemm_tn_n, 128x32x8_64x16x1_8x4_8x4_2x2) { using WarpShape = cutlass::gemm::GemmShape<64, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -794,9 +794,9 @@ TEST(SM50_device_minimum_plus_dsrgemm_tn_n, 16x64x16_8x16x1_2x2_4x8_2x4) { using WarpShape = 
cutlass::gemm::GemmShape<8, 16, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -830,9 +830,9 @@ TEST(SM50_device_minimum_plus_dsrgemm_tn_n, 16x128x16_8x32x1_2x4_4x8_2x4) { using WarpShape = cutlass::gemm::GemmShape<8, 32, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -866,9 +866,9 @@ TEST(SM50_device_minimum_plus_dsrgemm_tn_n, 32x32x8_16x8x1_2x2_8x4_2x4) { using WarpShape = cutlass::gemm::GemmShape<16, 8, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -902,9 +902,9 @@ TEST(SM50_device_minimum_plus_dsrgemm_tn_n, 32x64x8_16x16x1_4x2_4x8_2x4) { using WarpShape = cutlass::gemm::GemmShape<16, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 
1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -938,9 +938,9 @@ TEST(SM50_device_minimum_plus_dsrgemm_tn_n, 32x128x8_16x32x1_4x4_4x8_2x4) { using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -974,9 +974,9 @@ TEST(SM50_device_minimum_plus_dsrgemm_tn_n, 64x64x8_32x16x1_4x4_8x4_2x4) { using WarpShape = cutlass::gemm::GemmShape<32, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1010,9 +1010,9 @@ TEST(SM50_device_minimum_plus_dsrgemm_tn_n, 32x32x8_8x16x1_2x2_4x8_4x2) { using WarpShape = cutlass::gemm::GemmShape<8, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - 
precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1046,9 +1046,9 @@ TEST(SM50_device_minimum_plus_dsrgemm_tn_n, 64x32x8_16x16x1_4x2_4x8_4x2) { using WarpShape = cutlass::gemm::GemmShape<16, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1082,9 +1082,9 @@ TEST(SM50_device_minimum_plus_dsrgemm_tn_n, 64x64x8_16x32x1_4x4_4x8_4x2) { using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1118,9 +1118,9 @@ TEST(SM50_device_minimum_plus_dsrgemm_tn_n, 128x32x8_32x16x1_4x4_8x4_4x2) { using WarpShape = cutlass::gemm::GemmShape<32, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, 
SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1154,9 +1154,9 @@ TEST(SM50_device_minimum_plus_dsrgemm_tn_n, 32x64x16_8x16x1_2x2_4x8_4x4) { using WarpShape = cutlass::gemm::GemmShape<8, 16, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1190,9 +1190,9 @@ TEST(SM50_device_minimum_plus_dsrgemm_tn_n, 32x128x16_8x32x1_2x4_4x8_4x4) { using WarpShape = cutlass::gemm::GemmShape<8, 32, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1226,9 +1226,9 @@ TEST(SM50_device_minimum_plus_dsrgemm_tn_n, 64x32x16_16x8x1_2x2_8x4_4x4) { using WarpShape = cutlass::gemm::GemmShape<16, 8, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + 
precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1262,9 +1262,9 @@ TEST(SM50_device_minimum_plus_dsrgemm_tn_n, 64x64x8_16x16x1_4x2_4x8_4x4) { using WarpShape = cutlass::gemm::GemmShape<16, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1298,9 +1298,9 @@ TEST(SM50_device_minimum_plus_dsrgemm_tn_n, 128x32x16_32x8x1_4x2_8x4_4x4) { using WarpShape = cutlass::gemm::GemmShape<32, 8, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; diff --git a/test/device/sm50_simt_minimum_plus_dsrgemm_tn_t.cu b/test/device/sm50_simt_minimum_plus_dsrgemm_tn_t.cu index 216685f..ffbb3ad 100644 --- a/test/device/sm50_simt_minimum_plus_dsrgemm_tn_t.cu +++ b/test/device/sm50_simt_minimum_plus_dsrgemm_tn_t.cu @@ -38,9 +38,9 @@ TEST(SM50_device_minimum_plus_dsrgemm_tn_t, 8x32x8_8x32x1_2x4_4x8_1x1) { using WarpShape = cutlass::gemm::GemmShape<8, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - 
precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -74,9 +74,9 @@ TEST(SM50_device_minimum_plus_dsrgemm_tn_t, 16x32x8_16x32x1_4x4_4x8_1x1) { using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -110,9 +110,9 @@ TEST(SM50_device_minimum_plus_dsrgemm_tn_t, 16x64x8_16x64x1_4x8_4x8_1x1) { using WarpShape = cutlass::gemm::GemmShape<16, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -146,9 +146,9 @@ TEST(SM50_device_minimum_plus_dsrgemm_tn_t, 32x32x8_32x32x1_8x4_4x8_1x1) { using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; 
+ using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -182,9 +182,9 @@ TEST(SM50_device_minimum_plus_dsrgemm_tn_t, 8x32x8_8x16x1_2x2_4x8_1x2) { using WarpShape = cutlass::gemm::GemmShape<8, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -218,9 +218,9 @@ TEST(SM50_device_minimum_plus_dsrgemm_tn_t, 8x64x8_8x32x1_2x4_4x8_1x2) { using WarpShape = cutlass::gemm::GemmShape<8, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -254,9 +254,9 @@ TEST(SM50_device_minimum_plus_dsrgemm_tn_t, 16x32x8_16x16x1_4x2_4x8_1x2) { using WarpShape = cutlass::gemm::GemmShape<16, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, 
precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -290,9 +290,9 @@ TEST(SM50_device_minimum_plus_dsrgemm_tn_t, 16x64x8_16x32x1_4x4_4x8_1x2) { using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -326,9 +326,9 @@ TEST(SM50_device_minimum_plus_dsrgemm_tn_t, 16x128x8_16x64x1_4x8_4x8_1x2) { using WarpShape = cutlass::gemm::GemmShape<16, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -362,9 +362,9 @@ TEST(SM50_device_minimum_plus_dsrgemm_tn_t, 32x32x8_32x16x1_4x4_8x4_1x2) { using WarpShape = cutlass::gemm::GemmShape<32, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = 
Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -398,9 +398,9 @@ TEST(SM50_device_minimum_plus_dsrgemm_tn_t, 32x64x8_32x32x1_8x4_4x8_1x2) { using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -434,9 +434,9 @@ TEST(SM50_device_minimum_plus_dsrgemm_tn_t, 32x32x8_16x32x1_4x4_4x8_2x1) { using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -470,9 +470,9 @@ TEST(SM50_device_minimum_plus_dsrgemm_tn_t, 64x32x8_32x32x1_8x4_4x8_2x1) { using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -506,9 +506,9 @@ 
TEST(SM50_device_minimum_plus_dsrgemm_tn_t, 16x32x8_8x16x1_2x2_4x8_2x2) { using WarpShape = cutlass::gemm::GemmShape<8, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -542,9 +542,9 @@ TEST(SM50_device_minimum_plus_dsrgemm_tn_t, 16x64x8_8x32x1_2x4_4x8_2x2) { using WarpShape = cutlass::gemm::GemmShape<8, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -578,9 +578,9 @@ TEST(SM50_device_minimum_plus_dsrgemm_tn_t, 32x32x8_16x16x1_4x2_4x8_2x2) { using WarpShape = cutlass::gemm::GemmShape<16, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -614,9 +614,9 @@ TEST(SM50_device_minimum_plus_dsrgemm_tn_t, 32x64x8_16x32x1_4x4_4x8_2x2) { using WarpShape = 
cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -650,9 +650,9 @@ TEST(SM50_device_minimum_plus_dsrgemm_tn_t, 32x128x8_16x64x1_4x8_4x8_2x2) { using WarpShape = cutlass::gemm::GemmShape<16, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -686,9 +686,9 @@ TEST(SM50_device_minimum_plus_dsrgemm_tn_t, 64x32x8_32x16x1_4x4_8x4_2x2) { using WarpShape = cutlass::gemm::GemmShape<32, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -722,9 +722,9 @@ TEST(SM50_device_minimum_plus_dsrgemm_tn_t, 64x64x8_32x32x1_8x4_4x8_2x2) { using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 
1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -758,9 +758,9 @@ TEST(SM50_device_minimum_plus_dsrgemm_tn_t, 128x32x8_64x16x1_8x4_8x4_2x2) { using WarpShape = cutlass::gemm::GemmShape<64, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -794,9 +794,9 @@ TEST(SM50_device_minimum_plus_dsrgemm_tn_t, 16x64x16_8x16x1_2x2_4x8_2x4) { using WarpShape = cutlass::gemm::GemmShape<8, 16, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -830,9 +830,9 @@ TEST(SM50_device_minimum_plus_dsrgemm_tn_t, 16x128x16_8x32x1_2x4_4x8_2x4) { using WarpShape = cutlass::gemm::GemmShape<8, 32, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - 
precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -866,9 +866,9 @@ TEST(SM50_device_minimum_plus_dsrgemm_tn_t, 32x32x8_16x8x1_2x2_8x4_2x4) { using WarpShape = cutlass::gemm::GemmShape<16, 8, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -902,9 +902,9 @@ TEST(SM50_device_minimum_plus_dsrgemm_tn_t, 32x64x8_16x16x1_4x2_4x8_2x4) { using WarpShape = cutlass::gemm::GemmShape<16, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -938,9 +938,9 @@ TEST(SM50_device_minimum_plus_dsrgemm_tn_t, 32x128x8_16x32x1_4x4_4x8_2x4) { using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; 
+ using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -974,9 +974,9 @@ TEST(SM50_device_minimum_plus_dsrgemm_tn_t, 64x64x8_32x16x1_4x4_8x4_2x4) { using WarpShape = cutlass::gemm::GemmShape<32, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1010,9 +1010,9 @@ TEST(SM50_device_minimum_plus_dsrgemm_tn_t, 32x32x8_8x16x1_2x2_4x8_4x2) { using WarpShape = cutlass::gemm::GemmShape<8, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1046,9 +1046,9 @@ TEST(SM50_device_minimum_plus_dsrgemm_tn_t, 64x32x8_16x16x1_4x2_4x8_4x2) { using WarpShape = cutlass::gemm::GemmShape<16, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, 
precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1082,9 +1082,9 @@ TEST(SM50_device_minimum_plus_dsrgemm_tn_t, 64x64x8_16x32x1_4x4_4x8_4x2) { using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1118,9 +1118,9 @@ TEST(SM50_device_minimum_plus_dsrgemm_tn_t, 128x32x8_32x16x1_4x4_8x4_4x2) { using WarpShape = cutlass::gemm::GemmShape<32, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1154,9 +1154,9 @@ TEST(SM50_device_minimum_plus_dsrgemm_tn_t, 32x64x16_8x16x1_2x2_4x8_4x4) { using WarpShape = cutlass::gemm::GemmShape<8, 16, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using 
AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1190,9 +1190,9 @@ TEST(SM50_device_minimum_plus_dsrgemm_tn_t, 32x128x16_8x32x1_2x4_4x8_4x4) { using WarpShape = cutlass::gemm::GemmShape<8, 32, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1226,9 +1226,9 @@ TEST(SM50_device_minimum_plus_dsrgemm_tn_t, 64x32x16_16x8x1_2x2_8x4_4x4) { using WarpShape = cutlass::gemm::GemmShape<16, 8, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1262,9 +1262,9 @@ TEST(SM50_device_minimum_plus_dsrgemm_tn_t, 64x64x8_16x16x1_4x2_4x8_4x4) { using WarpShape = cutlass::gemm::GemmShape<16, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1298,9 +1298,9 
@@ TEST(SM50_device_minimum_plus_dsrgemm_tn_t, 128x32x16_32x8x1_4x2_8x4_4x4) { using WarpShape = cutlass::gemm::GemmShape<32, 8, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; diff --git a/test/device/sm50_simt_minimum_plus_dsrgemm_tt_n.cu b/test/device/sm50_simt_minimum_plus_dsrgemm_tt_n.cu index b3da2f5..3e1d36b 100644 --- a/test/device/sm50_simt_minimum_plus_dsrgemm_tt_n.cu +++ b/test/device/sm50_simt_minimum_plus_dsrgemm_tt_n.cu @@ -38,9 +38,9 @@ TEST(SM50_device_minimum_plus_dsrgemm_tt_n, 8x32x8_8x32x1_2x4_4x8_1x1) { using WarpShape = cutlass::gemm::GemmShape<8, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -74,9 +74,9 @@ TEST(SM50_device_minimum_plus_dsrgemm_tt_n, 16x32x8_16x32x1_4x4_4x8_1x1) { using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, 
precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -110,9 +110,9 @@ TEST(SM50_device_minimum_plus_dsrgemm_tt_n, 16x64x8_16x64x1_4x8_4x8_1x1) { using WarpShape = cutlass::gemm::GemmShape<16, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -146,9 +146,9 @@ TEST(SM50_device_minimum_plus_dsrgemm_tt_n, 32x32x8_32x32x1_8x4_4x8_1x1) { using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -182,9 +182,9 @@ TEST(SM50_device_minimum_plus_dsrgemm_tt_n, 8x32x8_8x16x1_2x2_4x8_1x2) { using WarpShape = cutlass::gemm::GemmShape<8, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = 
Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -218,9 +218,9 @@ TEST(SM50_device_minimum_plus_dsrgemm_tt_n, 8x64x8_8x32x1_2x4_4x8_1x2) { using WarpShape = cutlass::gemm::GemmShape<8, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -254,9 +254,9 @@ TEST(SM50_device_minimum_plus_dsrgemm_tt_n, 16x32x8_16x16x1_4x2_4x8_1x2) { using WarpShape = cutlass::gemm::GemmShape<16, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -290,9 +290,9 @@ TEST(SM50_device_minimum_plus_dsrgemm_tt_n, 16x64x8_16x32x1_4x4_4x8_1x2) { using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -326,9 +326,9 @@ 
TEST(SM50_device_minimum_plus_dsrgemm_tt_n, 16x128x8_16x64x1_4x8_4x8_1x2) { using WarpShape = cutlass::gemm::GemmShape<16, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -362,9 +362,9 @@ TEST(SM50_device_minimum_plus_dsrgemm_tt_n, 32x32x8_32x16x1_4x4_8x4_1x2) { using WarpShape = cutlass::gemm::GemmShape<32, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -398,9 +398,9 @@ TEST(SM50_device_minimum_plus_dsrgemm_tt_n, 32x64x8_32x32x1_8x4_4x8_1x2) { using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -434,9 +434,9 @@ TEST(SM50_device_minimum_plus_dsrgemm_tt_n, 32x32x8_16x32x1_4x4_4x8_2x1) { using WarpShape = 
cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -470,9 +470,9 @@ TEST(SM50_device_minimum_plus_dsrgemm_tt_n, 64x32x8_32x32x1_8x4_4x8_2x1) { using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -506,9 +506,9 @@ TEST(SM50_device_minimum_plus_dsrgemm_tt_n, 16x32x8_8x16x1_2x2_4x8_2x2) { using WarpShape = cutlass::gemm::GemmShape<8, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -542,9 +542,9 @@ TEST(SM50_device_minimum_plus_dsrgemm_tt_n, 16x64x8_8x32x1_2x4_4x8_2x2) { using WarpShape = cutlass::gemm::GemmShape<8, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - 
using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -578,9 +578,9 @@ TEST(SM50_device_minimum_plus_dsrgemm_tt_n, 32x32x8_16x16x1_4x2_4x8_2x2) { using WarpShape = cutlass::gemm::GemmShape<16, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -614,9 +614,9 @@ TEST(SM50_device_minimum_plus_dsrgemm_tt_n, 32x64x8_16x32x1_4x4_4x8_2x2) { using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -650,9 +650,9 @@ TEST(SM50_device_minimum_plus_dsrgemm_tt_n, 32x128x8_16x64x1_4x8_4x8_2x2) { using WarpShape = cutlass::gemm::GemmShape<16, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, 
precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -686,9 +686,9 @@ TEST(SM50_device_minimum_plus_dsrgemm_tt_n, 64x32x8_32x16x1_4x4_8x4_2x2) { using WarpShape = cutlass::gemm::GemmShape<32, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -722,9 +722,9 @@ TEST(SM50_device_minimum_plus_dsrgemm_tt_n, 64x64x8_32x32x1_8x4_4x8_2x2) { using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -758,9 +758,9 @@ TEST(SM50_device_minimum_plus_dsrgemm_tt_n, 128x32x8_64x16x1_8x4_8x4_2x2) { using WarpShape = cutlass::gemm::GemmShape<64, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using 
Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -794,9 +794,9 @@ TEST(SM50_device_minimum_plus_dsrgemm_tt_n, 16x64x16_8x16x1_2x2_4x8_2x4) { using WarpShape = cutlass::gemm::GemmShape<8, 16, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -830,9 +830,9 @@ TEST(SM50_device_minimum_plus_dsrgemm_tt_n, 16x128x16_8x32x1_2x4_4x8_2x4) { using WarpShape = cutlass::gemm::GemmShape<8, 32, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -866,9 +866,9 @@ TEST(SM50_device_minimum_plus_dsrgemm_tt_n, 32x32x8_16x8x1_2x2_8x4_2x4) { using WarpShape = cutlass::gemm::GemmShape<16, 8, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, 
precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -902,9 +902,9 @@ TEST(SM50_device_minimum_plus_dsrgemm_tt_n, 32x64x8_16x16x1_4x2_4x8_2x4) { using WarpShape = cutlass::gemm::GemmShape<16, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -938,9 +938,9 @@ TEST(SM50_device_minimum_plus_dsrgemm_tt_n, 32x128x8_16x32x1_4x4_4x8_2x4) { using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -974,9 +974,9 @@ TEST(SM50_device_minimum_plus_dsrgemm_tt_n, 64x64x8_32x16x1_4x4_8x4_2x4) { using WarpShape = cutlass::gemm::GemmShape<32, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = 
Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1010,9 +1010,9 @@ TEST(SM50_device_minimum_plus_dsrgemm_tt_n, 32x32x8_8x16x1_2x2_4x8_4x2) { using WarpShape = cutlass::gemm::GemmShape<8, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1046,9 +1046,9 @@ TEST(SM50_device_minimum_plus_dsrgemm_tt_n, 64x32x8_16x16x1_4x2_4x8_4x2) { using WarpShape = cutlass::gemm::GemmShape<16, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1082,9 +1082,9 @@ TEST(SM50_device_minimum_plus_dsrgemm_tt_n, 64x64x8_16x32x1_4x4_4x8_4x2) { using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1118,9 +1118,9 @@ 
TEST(SM50_device_minimum_plus_dsrgemm_tt_n, 128x32x8_32x16x1_4x4_8x4_4x2) { using WarpShape = cutlass::gemm::GemmShape<32, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1154,9 +1154,9 @@ TEST(SM50_device_minimum_plus_dsrgemm_tt_n, 32x64x16_8x16x1_2x2_4x8_4x4) { using WarpShape = cutlass::gemm::GemmShape<8, 16, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1190,9 +1190,9 @@ TEST(SM50_device_minimum_plus_dsrgemm_tt_n, 32x128x16_8x32x1_2x4_4x8_4x4) { using WarpShape = cutlass::gemm::GemmShape<8, 32, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1226,9 +1226,9 @@ TEST(SM50_device_minimum_plus_dsrgemm_tt_n, 64x32x16_16x8x1_2x2_8x4_4x4) { using 
WarpShape = cutlass::gemm::GemmShape<16, 8, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1262,9 +1262,9 @@ TEST(SM50_device_minimum_plus_dsrgemm_tt_n, 64x64x8_16x16x1_4x2_4x8_4x4) { using WarpShape = cutlass::gemm::GemmShape<16, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1298,9 +1298,9 @@ TEST(SM50_device_minimum_plus_dsrgemm_tt_n, 128x32x16_32x8x1_4x2_8x4_4x4) { using WarpShape = cutlass::gemm::GemmShape<32, 8, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; diff --git a/test/device/sm50_simt_minimum_plus_dsrgemm_tt_t.cu b/test/device/sm50_simt_minimum_plus_dsrgemm_tt_t.cu index c452881..a33a763 100644 --- 
a/test/device/sm50_simt_minimum_plus_dsrgemm_tt_t.cu +++ b/test/device/sm50_simt_minimum_plus_dsrgemm_tt_t.cu @@ -38,9 +38,9 @@ TEST(SM50_device_minimum_plus_dsrgemm_tt_t, 8x32x8_8x32x1_2x4_4x8_1x1) { using WarpShape = cutlass::gemm::GemmShape<8, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -74,9 +74,9 @@ TEST(SM50_device_minimum_plus_dsrgemm_tt_t, 16x32x8_16x32x1_4x4_4x8_1x1) { using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -110,9 +110,9 @@ TEST(SM50_device_minimum_plus_dsrgemm_tt_t, 16x64x8_16x64x1_4x8_4x8_1x1) { using WarpShape = cutlass::gemm::GemmShape<16, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = 
Config::MultiplicationOp; @@ -146,9 +146,9 @@ TEST(SM50_device_minimum_plus_dsrgemm_tt_t, 32x32x8_32x32x1_8x4_4x8_1x1) { using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -182,9 +182,9 @@ TEST(SM50_device_minimum_plus_dsrgemm_tt_t, 8x32x8_8x16x1_2x2_4x8_1x2) { using WarpShape = cutlass::gemm::GemmShape<8, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -218,9 +218,9 @@ TEST(SM50_device_minimum_plus_dsrgemm_tt_t, 8x64x8_8x32x1_2x4_4x8_1x2) { using WarpShape = cutlass::gemm::GemmShape<8, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -254,9 +254,9 @@ TEST(SM50_device_minimum_plus_dsrgemm_tt_t, 
16x32x8_16x16x1_4x2_4x8_1x2) { using WarpShape = cutlass::gemm::GemmShape<16, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -290,9 +290,9 @@ TEST(SM50_device_minimum_plus_dsrgemm_tt_t, 16x64x8_16x32x1_4x4_4x8_1x2) { using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -326,9 +326,9 @@ TEST(SM50_device_minimum_plus_dsrgemm_tt_t, 16x128x8_16x64x1_4x8_4x8_1x2) { using WarpShape = cutlass::gemm::GemmShape<16, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -362,9 +362,9 @@ TEST(SM50_device_minimum_plus_dsrgemm_tt_t, 32x32x8_32x16x1_4x4_8x4_1x2) { using WarpShape = cutlass::gemm::GemmShape<32, 16, 8>; using 
InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -398,9 +398,9 @@ TEST(SM50_device_minimum_plus_dsrgemm_tt_t, 32x64x8_32x32x1_8x4_4x8_1x2) { using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -434,9 +434,9 @@ TEST(SM50_device_minimum_plus_dsrgemm_tt_t, 32x32x8_16x32x1_4x4_4x8_2x1) { using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -470,9 +470,9 @@ TEST(SM50_device_minimum_plus_dsrgemm_tt_t, 64x32x8_32x32x1_8x4_4x8_2x1) { using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename 
cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -506,9 +506,9 @@ TEST(SM50_device_minimum_plus_dsrgemm_tt_t, 16x32x8_8x16x1_2x2_4x8_2x2) { using WarpShape = cutlass::gemm::GemmShape<8, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -542,9 +542,9 @@ TEST(SM50_device_minimum_plus_dsrgemm_tt_t, 16x64x8_8x32x1_2x4_4x8_2x2) { using WarpShape = cutlass::gemm::GemmShape<8, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -578,9 +578,9 @@ TEST(SM50_device_minimum_plus_dsrgemm_tt_t, 32x32x8_16x16x1_4x2_4x8_2x2) { using WarpShape = cutlass::gemm::GemmShape<16, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, 
precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -614,9 +614,9 @@ TEST(SM50_device_minimum_plus_dsrgemm_tt_t, 32x64x8_16x32x1_4x4_4x8_2x2) { using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -650,9 +650,9 @@ TEST(SM50_device_minimum_plus_dsrgemm_tt_t, 32x128x8_16x64x1_4x8_4x8_2x2) { using WarpShape = cutlass::gemm::GemmShape<16, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -686,9 +686,9 @@ TEST(SM50_device_minimum_plus_dsrgemm_tt_t, 64x32x8_32x16x1_4x4_8x4_2x2) { using WarpShape = cutlass::gemm::GemmShape<32, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename 
cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -722,9 +722,9 @@ TEST(SM50_device_minimum_plus_dsrgemm_tt_t, 64x64x8_32x32x1_8x4_4x8_2x2) { using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -758,9 +758,9 @@ TEST(SM50_device_minimum_plus_dsrgemm_tt_t, 128x32x8_64x16x1_8x4_8x4_2x2) { using WarpShape = cutlass::gemm::GemmShape<64, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -794,9 +794,9 @@ TEST(SM50_device_minimum_plus_dsrgemm_tt_t, 16x64x16_8x16x1_2x2_4x8_2x4) { using WarpShape = cutlass::gemm::GemmShape<8, 16, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, 
precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -830,9 +830,9 @@ TEST(SM50_device_minimum_plus_dsrgemm_tt_t, 16x128x16_8x32x1_2x4_4x8_2x4) { using WarpShape = cutlass::gemm::GemmShape<8, 32, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -866,9 +866,9 @@ TEST(SM50_device_minimum_plus_dsrgemm_tt_t, 32x32x8_16x8x1_2x2_8x4_2x4) { using WarpShape = cutlass::gemm::GemmShape<16, 8, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -902,9 +902,9 @@ TEST(SM50_device_minimum_plus_dsrgemm_tt_t, 32x64x8_16x16x1_4x2_4x8_2x4) { using WarpShape = cutlass::gemm::GemmShape<16, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; 
using MultOp = Config::MultiplicationOp; @@ -938,9 +938,9 @@ TEST(SM50_device_minimum_plus_dsrgemm_tt_t, 32x128x8_16x32x1_4x4_4x8_2x4) { using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -974,9 +974,9 @@ TEST(SM50_device_minimum_plus_dsrgemm_tt_t, 64x64x8_32x16x1_4x4_8x4_2x4) { using WarpShape = cutlass::gemm::GemmShape<32, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1010,9 +1010,9 @@ TEST(SM50_device_minimum_plus_dsrgemm_tt_t, 32x32x8_8x16x1_2x2_4x8_4x2) { using WarpShape = cutlass::gemm::GemmShape<8, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1046,9 +1046,9 @@ 
TEST(SM50_device_minimum_plus_dsrgemm_tt_t, 64x32x8_16x16x1_4x2_4x8_4x2) { using WarpShape = cutlass::gemm::GemmShape<16, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1082,9 +1082,9 @@ TEST(SM50_device_minimum_plus_dsrgemm_tt_t, 64x64x8_16x32x1_4x4_4x8_4x2) { using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1118,9 +1118,9 @@ TEST(SM50_device_minimum_plus_dsrgemm_tt_t, 128x32x8_32x16x1_4x4_8x4_4x2) { using WarpShape = cutlass::gemm::GemmShape<32, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1154,9 +1154,9 @@ TEST(SM50_device_minimum_plus_dsrgemm_tt_t, 32x64x16_8x16x1_2x2_4x8_4x4) { using 
WarpShape = cutlass::gemm::GemmShape<8, 16, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1190,9 +1190,9 @@ TEST(SM50_device_minimum_plus_dsrgemm_tt_t, 32x128x16_8x32x1_2x4_4x8_4x4) { using WarpShape = cutlass::gemm::GemmShape<8, 32, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1226,9 +1226,9 @@ TEST(SM50_device_minimum_plus_dsrgemm_tt_t, 64x32x16_16x8x1_2x2_8x4_4x4) { using WarpShape = cutlass::gemm::GemmShape<16, 8, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1262,9 +1262,9 @@ TEST(SM50_device_minimum_plus_dsrgemm_tt_t, 64x64x8_16x16x1_4x2_4x8_4x4) { using WarpShape = cutlass::gemm::GemmShape<16, 16, 8>; using InstructionShape = 
cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1298,9 +1298,9 @@ TEST(SM50_device_minimum_plus_dsrgemm_tt_t, 128x32x16_32x8x1_4x2_8x4_4x4) { using WarpShape = cutlass::gemm::GemmShape<32, 8, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; diff --git a/test/device/sm50_simt_minimum_plus_ssrgemm_nn_n.cu b/test/device/sm50_simt_minimum_plus_ssrgemm_nn_n.cu index 1a19a7b..f7e1b35 100644 --- a/test/device/sm50_simt_minimum_plus_ssrgemm_nn_n.cu +++ b/test/device/sm50_simt_minimum_plus_ssrgemm_nn_n.cu @@ -38,9 +38,9 @@ TEST(SM50_device_minimum_plus_ssrgemm_nn_n, 8x32x8_8x32x1_2x4_4x8_1x1) { using WarpShape = cutlass::gemm::GemmShape<8, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -74,9 
+74,9 @@ TEST(SM50_device_minimum_plus_ssrgemm_nn_n, 16x32x8_16x32x1_4x4_4x8_1x1) { using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -110,9 +110,9 @@ TEST(SM50_device_minimum_plus_ssrgemm_nn_n, 16x64x8_16x64x1_4x8_4x8_1x1) { using WarpShape = cutlass::gemm::GemmShape<16, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -146,9 +146,9 @@ TEST(SM50_device_minimum_plus_ssrgemm_nn_n, 32x32x8_32x32x1_8x4_4x8_1x1) { using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -182,9 +182,9 @@ TEST(SM50_device_minimum_plus_ssrgemm_nn_n, 32x64x8_32x64x1_8x8_4x8_1x1) { using 
WarpShape = cutlass::gemm::GemmShape<32, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -218,9 +218,9 @@ TEST(SM50_device_minimum_plus_ssrgemm_nn_n, 64x32x8_64x32x1_8x8_8x4_1x1) { using WarpShape = cutlass::gemm::GemmShape<64, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -254,9 +254,9 @@ TEST(SM50_device_minimum_plus_ssrgemm_nn_n, 8x32x8_8x16x1_2x2_4x8_1x2) { using WarpShape = cutlass::gemm::GemmShape<8, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -290,9 +290,9 @@ TEST(SM50_device_minimum_plus_ssrgemm_nn_n, 8x64x8_8x32x1_2x4_4x8_1x2) { using WarpShape = cutlass::gemm::GemmShape<8, 32, 8>; using InstructionShape = 
cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -326,9 +326,9 @@ TEST(SM50_device_minimum_plus_ssrgemm_nn_n, 16x32x8_16x16x1_4x2_4x8_1x2) { using WarpShape = cutlass::gemm::GemmShape<16, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -362,9 +362,9 @@ TEST(SM50_device_minimum_plus_ssrgemm_nn_n, 16x64x8_16x32x1_4x4_4x8_1x2) { using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -398,9 +398,9 @@ TEST(SM50_device_minimum_plus_ssrgemm_nn_n, 16x128x8_16x64x1_4x8_4x8_1x2) { using WarpShape = cutlass::gemm::GemmShape<16, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename 
cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -434,9 +434,9 @@ TEST(SM50_device_minimum_plus_ssrgemm_nn_n, 32x32x8_32x16x1_4x4_8x4_1x2) { using WarpShape = cutlass::gemm::GemmShape<32, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -470,9 +470,9 @@ TEST(SM50_device_minimum_plus_ssrgemm_nn_n, 32x64x8_32x32x1_8x4_4x8_1x2) { using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -506,9 +506,9 @@ TEST(SM50_device_minimum_plus_ssrgemm_nn_n, 32x128x8_32x64x1_8x8_4x8_1x2) { using WarpShape = cutlass::gemm::GemmShape<32, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, 
precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -542,9 +542,9 @@ TEST(SM50_device_minimum_plus_ssrgemm_nn_n, 64x64x8_64x32x1_8x8_8x4_1x2) { using WarpShape = cutlass::gemm::GemmShape<64, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -578,9 +578,9 @@ TEST(SM50_device_minimum_plus_ssrgemm_nn_n, 32x32x8_16x32x1_4x4_4x8_2x1) { using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -614,9 +614,9 @@ TEST(SM50_device_minimum_plus_ssrgemm_nn_n, 64x32x8_32x32x1_8x4_4x8_2x1) { using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename 
cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -650,9 +650,9 @@ TEST(SM50_device_minimum_plus_ssrgemm_nn_n, 64x64x8_32x64x1_8x8_4x8_2x1) { using WarpShape = cutlass::gemm::GemmShape<32, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -686,9 +686,9 @@ TEST(SM50_device_minimum_plus_ssrgemm_nn_n, 128x32x8_64x32x1_8x8_8x4_2x1) { using WarpShape = cutlass::gemm::GemmShape<64, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -722,9 +722,9 @@ TEST(SM50_device_minimum_plus_ssrgemm_nn_n, 16x32x8_8x16x1_2x2_4x8_2x2) { using WarpShape = cutlass::gemm::GemmShape<8, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, 
precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -758,9 +758,9 @@ TEST(SM50_device_minimum_plus_ssrgemm_nn_n, 16x64x8_8x32x1_2x4_4x8_2x2) { using WarpShape = cutlass::gemm::GemmShape<8, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -794,9 +794,9 @@ TEST(SM50_device_minimum_plus_ssrgemm_nn_n, 32x32x8_16x16x1_4x2_4x8_2x2) { using WarpShape = cutlass::gemm::GemmShape<16, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -830,9 +830,9 @@ TEST(SM50_device_minimum_plus_ssrgemm_nn_n, 32x64x8_16x32x1_4x4_4x8_2x2) { using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; 
using MultOp = Config::MultiplicationOp; @@ -866,9 +866,9 @@ TEST(SM50_device_minimum_plus_ssrgemm_nn_n, 32x128x8_16x64x1_4x8_4x8_2x2) { using WarpShape = cutlass::gemm::GemmShape<16, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -902,9 +902,9 @@ TEST(SM50_device_minimum_plus_ssrgemm_nn_n, 64x32x8_32x16x1_4x4_8x4_2x2) { using WarpShape = cutlass::gemm::GemmShape<32, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -938,9 +938,9 @@ TEST(SM50_device_minimum_plus_ssrgemm_nn_n, 64x64x8_32x32x1_8x4_4x8_2x2) { using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -974,9 +974,9 @@ 
TEST(SM50_device_minimum_plus_ssrgemm_nn_n, 64x128x8_32x64x1_8x8_4x8_2x2) { using WarpShape = cutlass::gemm::GemmShape<32, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1010,9 +1010,9 @@ TEST(SM50_device_minimum_plus_ssrgemm_nn_n, 128x32x8_64x16x1_8x4_8x4_2x2) { using WarpShape = cutlass::gemm::GemmShape<64, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1046,9 +1046,9 @@ TEST(SM50_device_minimum_plus_ssrgemm_nn_n, 128x64x8_64x32x1_8x8_8x4_2x2) { using WarpShape = cutlass::gemm::GemmShape<64, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1082,9 +1082,9 @@ TEST(SM50_device_minimum_plus_ssrgemm_nn_n, 16x64x16_8x16x1_2x2_4x8_2x4) { using 
WarpShape = cutlass::gemm::GemmShape<8, 16, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1118,9 +1118,9 @@ TEST(SM50_device_minimum_plus_ssrgemm_nn_n, 16x128x16_8x32x1_2x4_4x8_2x4) { using WarpShape = cutlass::gemm::GemmShape<8, 32, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1154,9 +1154,9 @@ TEST(SM50_device_minimum_plus_ssrgemm_nn_n, 32x32x8_16x8x1_2x2_8x4_2x4) { using WarpShape = cutlass::gemm::GemmShape<16, 8, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1190,9 +1190,9 @@ TEST(SM50_device_minimum_plus_ssrgemm_nn_n, 32x64x8_16x16x1_4x2_4x8_2x4) { using WarpShape = cutlass::gemm::GemmShape<16, 16, 8>; using InstructionShape = 
cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1226,9 +1226,9 @@ TEST(SM50_device_minimum_plus_ssrgemm_nn_n, 32x128x8_16x32x1_4x4_4x8_2x4) { using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1262,9 +1262,9 @@ TEST(SM50_device_minimum_plus_ssrgemm_nn_n, 32x256x8_16x64x1_4x8_4x8_2x4) { using WarpShape = cutlass::gemm::GemmShape<16, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1298,9 +1298,9 @@ TEST(SM50_device_minimum_plus_ssrgemm_nn_n, 64x64x8_32x16x1_4x4_8x4_2x4) { using WarpShape = cutlass::gemm::GemmShape<32, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename 
cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1334,9 +1334,9 @@ TEST(SM50_device_minimum_plus_ssrgemm_nn_n, 64x128x8_32x32x1_8x4_4x8_2x4) { using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1370,9 +1370,9 @@ TEST(SM50_device_minimum_plus_ssrgemm_nn_n, 64x256x8_32x64x1_8x8_4x8_2x4) { using WarpShape = cutlass::gemm::GemmShape<32, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1406,9 +1406,9 @@ TEST(SM50_device_minimum_plus_ssrgemm_nn_n, 128x128x8_64x32x1_8x8_8x4_2x4) { using WarpShape = cutlass::gemm::GemmShape<64, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, 
precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1442,9 +1442,9 @@ TEST(SM50_device_minimum_plus_ssrgemm_nn_n, 32x32x8_8x16x1_2x2_4x8_4x2) { using WarpShape = cutlass::gemm::GemmShape<8, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1478,9 +1478,9 @@ TEST(SM50_device_minimum_plus_ssrgemm_nn_n, 64x32x8_16x16x1_4x2_4x8_4x2) { using WarpShape = cutlass::gemm::GemmShape<16, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1514,9 +1514,9 @@ TEST(SM50_device_minimum_plus_ssrgemm_nn_n, 64x64x8_16x32x1_4x4_4x8_4x2) { using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = 
typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1550,9 +1550,9 @@ TEST(SM50_device_minimum_plus_ssrgemm_nn_n, 128x32x8_32x16x1_4x4_8x4_4x2) { using WarpShape = cutlass::gemm::GemmShape<32, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1586,9 +1586,9 @@ TEST(SM50_device_minimum_plus_ssrgemm_nn_n, 128x64x8_32x32x1_8x4_4x8_4x2) { using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1622,9 +1622,9 @@ TEST(SM50_device_minimum_plus_ssrgemm_nn_n, 128x128x8_32x64x1_8x8_4x8_4x2) { using WarpShape = cutlass::gemm::GemmShape<32, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, 
precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1658,9 +1658,9 @@ TEST(SM50_device_minimum_plus_ssrgemm_nn_n, 256x32x8_64x16x1_8x4_8x4_4x2) { using WarpShape = cutlass::gemm::GemmShape<64, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1694,9 +1694,9 @@ TEST(SM50_device_minimum_plus_ssrgemm_nn_n, 256x64x8_64x32x1_8x8_8x4_4x2) { using WarpShape = cutlass::gemm::GemmShape<64, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1730,9 +1730,9 @@ TEST(SM50_device_minimum_plus_ssrgemm_nn_n, 32x64x16_8x16x1_2x2_4x8_4x4) { using WarpShape = cutlass::gemm::GemmShape<8, 16, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = 
Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1766,9 +1766,9 @@ TEST(SM50_device_minimum_plus_ssrgemm_nn_n, 32x128x16_8x32x1_2x4_4x8_4x4) { using WarpShape = cutlass::gemm::GemmShape<8, 32, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1802,9 +1802,9 @@ TEST(SM50_device_minimum_plus_ssrgemm_nn_n, 64x32x16_16x8x1_2x2_8x4_4x4) { using WarpShape = cutlass::gemm::GemmShape<16, 8, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1838,9 +1838,9 @@ TEST(SM50_device_minimum_plus_ssrgemm_nn_n, 64x64x8_16x16x1_4x2_4x8_4x4) { using WarpShape = cutlass::gemm::GemmShape<16, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1874,9 +1874,9 @@ 
TEST(SM50_device_minimum_plus_ssrgemm_nn_n, 64x128x8_16x32x1_4x4_4x8_4x4) { using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1910,9 +1910,9 @@ TEST(SM50_device_minimum_plus_ssrgemm_nn_n, 64x256x8_16x64x1_4x8_4x8_4x4) { using WarpShape = cutlass::gemm::GemmShape<16, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1946,9 +1946,9 @@ TEST(SM50_device_minimum_plus_ssrgemm_nn_n, 128x32x16_32x8x1_4x2_8x4_4x4) { using WarpShape = cutlass::gemm::GemmShape<32, 8, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1982,9 +1982,9 @@ TEST(SM50_device_minimum_plus_ssrgemm_nn_n, 128x64x8_32x16x1_4x4_8x4_4x4) { using 
WarpShape = cutlass::gemm::GemmShape<32, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -2018,9 +2018,9 @@ TEST(SM50_device_minimum_plus_ssrgemm_nn_n, 128x128x8_32x32x1_8x4_4x8_4x4) { using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -2054,9 +2054,9 @@ TEST(SM50_device_minimum_plus_ssrgemm_nn_n, 256x64x8_64x16x1_8x4_8x4_4x4) { using WarpShape = cutlass::gemm::GemmShape<64, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; diff --git a/test/device/sm50_simt_minimum_plus_ssrgemm_nn_t.cu b/test/device/sm50_simt_minimum_plus_ssrgemm_nn_t.cu index df4cb7d..b0f9dcd 100644 --- 
a/test/device/sm50_simt_minimum_plus_ssrgemm_nn_t.cu +++ b/test/device/sm50_simt_minimum_plus_ssrgemm_nn_t.cu @@ -38,9 +38,9 @@ TEST(SM50_device_minimum_plus_ssrgemm_nn_t, 8x32x8_8x32x1_2x4_4x8_1x1) { using WarpShape = cutlass::gemm::GemmShape<8, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -74,9 +74,9 @@ TEST(SM50_device_minimum_plus_ssrgemm_nn_t, 16x32x8_16x32x1_4x4_4x8_1x1) { using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -110,9 +110,9 @@ TEST(SM50_device_minimum_plus_ssrgemm_nn_t, 16x64x8_16x64x1_4x8_4x8_1x1) { using WarpShape = cutlass::gemm::GemmShape<16, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = 
Config::MultiplicationOp; @@ -146,9 +146,9 @@ TEST(SM50_device_minimum_plus_ssrgemm_nn_t, 32x32x8_32x32x1_8x4_4x8_1x1) { using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -182,9 +182,9 @@ TEST(SM50_device_minimum_plus_ssrgemm_nn_t, 32x64x8_32x64x1_8x8_4x8_1x1) { using WarpShape = cutlass::gemm::GemmShape<32, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -218,9 +218,9 @@ TEST(SM50_device_minimum_plus_ssrgemm_nn_t, 64x32x8_64x32x1_8x8_8x4_1x1) { using WarpShape = cutlass::gemm::GemmShape<64, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -254,9 +254,9 @@ TEST(SM50_device_minimum_plus_ssrgemm_nn_t, 
8x32x8_8x16x1_2x2_4x8_1x2) { using WarpShape = cutlass::gemm::GemmShape<8, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -290,9 +290,9 @@ TEST(SM50_device_minimum_plus_ssrgemm_nn_t, 8x64x8_8x32x1_2x4_4x8_1x2) { using WarpShape = cutlass::gemm::GemmShape<8, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -326,9 +326,9 @@ TEST(SM50_device_minimum_plus_ssrgemm_nn_t, 16x32x8_16x16x1_4x2_4x8_1x2) { using WarpShape = cutlass::gemm::GemmShape<16, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -362,9 +362,9 @@ TEST(SM50_device_minimum_plus_ssrgemm_nn_t, 16x64x8_16x32x1_4x4_4x8_1x2) { using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using 
InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -398,9 +398,9 @@ TEST(SM50_device_minimum_plus_ssrgemm_nn_t, 16x128x8_16x64x1_4x8_4x8_1x2) { using WarpShape = cutlass::gemm::GemmShape<16, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -434,9 +434,9 @@ TEST(SM50_device_minimum_plus_ssrgemm_nn_t, 32x32x8_32x16x1_4x4_8x4_1x2) { using WarpShape = cutlass::gemm::GemmShape<32, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -470,9 +470,9 @@ TEST(SM50_device_minimum_plus_ssrgemm_nn_t, 32x64x8_32x32x1_8x4_4x8_1x2) { using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename 
cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -506,9 +506,9 @@ TEST(SM50_device_minimum_plus_ssrgemm_nn_t, 32x128x8_32x64x1_8x8_4x8_1x2) { using WarpShape = cutlass::gemm::GemmShape<32, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -542,9 +542,9 @@ TEST(SM50_device_minimum_plus_ssrgemm_nn_t, 64x64x8_64x32x1_8x8_8x4_1x2) { using WarpShape = cutlass::gemm::GemmShape<64, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -578,9 +578,9 @@ TEST(SM50_device_minimum_plus_ssrgemm_nn_t, 32x32x8_16x32x1_4x4_4x8_2x1) { using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, 
precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -614,9 +614,9 @@ TEST(SM50_device_minimum_plus_ssrgemm_nn_t, 64x32x8_32x32x1_8x4_4x8_2x1) { using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -650,9 +650,9 @@ TEST(SM50_device_minimum_plus_ssrgemm_nn_t, 64x64x8_32x64x1_8x8_4x8_2x1) { using WarpShape = cutlass::gemm::GemmShape<32, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -686,9 +686,9 @@ TEST(SM50_device_minimum_plus_ssrgemm_nn_t, 128x32x8_64x32x1_8x8_8x4_2x1) { using WarpShape = cutlass::gemm::GemmShape<64, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename 
cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -722,9 +722,9 @@ TEST(SM50_device_minimum_plus_ssrgemm_nn_t, 16x32x8_8x16x1_2x2_4x8_2x2) { using WarpShape = cutlass::gemm::GemmShape<8, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -758,9 +758,9 @@ TEST(SM50_device_minimum_plus_ssrgemm_nn_t, 16x64x8_8x32x1_2x4_4x8_2x2) { using WarpShape = cutlass::gemm::GemmShape<8, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -794,9 +794,9 @@ TEST(SM50_device_minimum_plus_ssrgemm_nn_t, 32x32x8_16x16x1_4x2_4x8_2x2) { using WarpShape = cutlass::gemm::GemmShape<16, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + 
cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -830,9 +830,9 @@ TEST(SM50_device_minimum_plus_ssrgemm_nn_t, 32x64x8_16x32x1_4x4_4x8_2x2) { using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -866,9 +866,9 @@ TEST(SM50_device_minimum_plus_ssrgemm_nn_t, 32x128x8_16x64x1_4x8_4x8_2x2) { using WarpShape = cutlass::gemm::GemmShape<16, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -902,9 +902,9 @@ TEST(SM50_device_minimum_plus_ssrgemm_nn_t, 64x32x8_32x16x1_4x4_8x4_2x2) { using WarpShape = cutlass::gemm::GemmShape<32, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp 
= Config::MultiplicationOp; @@ -938,9 +938,9 @@ TEST(SM50_device_minimum_plus_ssrgemm_nn_t, 64x64x8_32x32x1_8x4_4x8_2x2) { using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -974,9 +974,9 @@ TEST(SM50_device_minimum_plus_ssrgemm_nn_t, 64x128x8_32x64x1_8x8_4x8_2x2) { using WarpShape = cutlass::gemm::GemmShape<32, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1010,9 +1010,9 @@ TEST(SM50_device_minimum_plus_ssrgemm_nn_t, 128x32x8_64x16x1_8x4_8x4_2x2) { using WarpShape = cutlass::gemm::GemmShape<64, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1046,9 +1046,9 @@ 
TEST(SM50_device_minimum_plus_ssrgemm_nn_t, 128x64x8_64x32x1_8x8_8x4_2x2) { using WarpShape = cutlass::gemm::GemmShape<64, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1082,9 +1082,9 @@ TEST(SM50_device_minimum_plus_ssrgemm_nn_t, 16x64x16_8x16x1_2x2_4x8_2x4) { using WarpShape = cutlass::gemm::GemmShape<8, 16, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1118,9 +1118,9 @@ TEST(SM50_device_minimum_plus_ssrgemm_nn_t, 16x128x16_8x32x1_2x4_4x8_2x4) { using WarpShape = cutlass::gemm::GemmShape<8, 32, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1154,9 +1154,9 @@ TEST(SM50_device_minimum_plus_ssrgemm_nn_t, 32x32x8_16x8x1_2x2_8x4_2x4) { using 
WarpShape = cutlass::gemm::GemmShape<16, 8, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1190,9 +1190,9 @@ TEST(SM50_device_minimum_plus_ssrgemm_nn_t, 32x64x8_16x16x1_4x2_4x8_2x4) { using WarpShape = cutlass::gemm::GemmShape<16, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1226,9 +1226,9 @@ TEST(SM50_device_minimum_plus_ssrgemm_nn_t, 32x128x8_16x32x1_4x4_4x8_2x4) { using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1262,9 +1262,9 @@ TEST(SM50_device_minimum_plus_ssrgemm_nn_t, 32x256x8_16x64x1_4x8_4x8_2x4) { using WarpShape = cutlass::gemm::GemmShape<16, 64, 8>; using InstructionShape = 
cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1298,9 +1298,9 @@ TEST(SM50_device_minimum_plus_ssrgemm_nn_t, 64x64x8_32x16x1_4x4_8x4_2x4) { using WarpShape = cutlass::gemm::GemmShape<32, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1334,9 +1334,9 @@ TEST(SM50_device_minimum_plus_ssrgemm_nn_t, 64x128x8_32x32x1_8x4_4x8_2x4) { using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1370,9 +1370,9 @@ TEST(SM50_device_minimum_plus_ssrgemm_nn_t, 64x256x8_32x64x1_8x8_4x8_2x4) { using WarpShape = cutlass::gemm::GemmShape<32, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename 
cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1406,9 +1406,9 @@ TEST(SM50_device_minimum_plus_ssrgemm_nn_t, 128x128x8_64x32x1_8x8_8x4_2x4) { using WarpShape = cutlass::gemm::GemmShape<64, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1442,9 +1442,9 @@ TEST(SM50_device_minimum_plus_ssrgemm_nn_t, 32x32x8_8x16x1_2x2_4x8_4x2) { using WarpShape = cutlass::gemm::GemmShape<8, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1478,9 +1478,9 @@ TEST(SM50_device_minimum_plus_ssrgemm_nn_t, 64x32x8_16x16x1_4x2_4x8_4x2) { using WarpShape = cutlass::gemm::GemmShape<16, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, 
precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1514,9 +1514,9 @@ TEST(SM50_device_minimum_plus_ssrgemm_nn_t, 64x64x8_16x32x1_4x4_4x8_4x2) { using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1550,9 +1550,9 @@ TEST(SM50_device_minimum_plus_ssrgemm_nn_t, 128x32x8_32x16x1_4x4_8x4_4x2) { using WarpShape = cutlass::gemm::GemmShape<32, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1586,9 +1586,9 @@ TEST(SM50_device_minimum_plus_ssrgemm_nn_t, 128x64x8_32x32x1_8x4_4x8_4x2) { using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = 
typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1622,9 +1622,9 @@ TEST(SM50_device_minimum_plus_ssrgemm_nn_t, 128x128x8_32x64x1_8x8_4x8_4x2) { using WarpShape = cutlass::gemm::GemmShape<32, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1658,9 +1658,9 @@ TEST(SM50_device_minimum_plus_ssrgemm_nn_t, 256x32x8_64x16x1_8x4_8x4_4x2) { using WarpShape = cutlass::gemm::GemmShape<64, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1694,9 +1694,9 @@ TEST(SM50_device_minimum_plus_ssrgemm_nn_t, 256x64x8_64x32x1_8x8_8x4_4x2) { using WarpShape = cutlass::gemm::GemmShape<64, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, 
precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1730,9 +1730,9 @@ TEST(SM50_device_minimum_plus_ssrgemm_nn_t, 32x64x16_8x16x1_2x2_4x8_4x4) { using WarpShape = cutlass::gemm::GemmShape<8, 16, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1766,9 +1766,9 @@ TEST(SM50_device_minimum_plus_ssrgemm_nn_t, 32x128x16_8x32x1_2x4_4x8_4x4) { using WarpShape = cutlass::gemm::GemmShape<8, 32, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1802,9 +1802,9 @@ TEST(SM50_device_minimum_plus_ssrgemm_nn_t, 64x32x16_16x8x1_2x2_8x4_4x4) { using WarpShape = cutlass::gemm::GemmShape<16, 8, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = 
Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1838,9 +1838,9 @@ TEST(SM50_device_minimum_plus_ssrgemm_nn_t, 64x64x8_16x16x1_4x2_4x8_4x4) { using WarpShape = cutlass::gemm::GemmShape<16, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1874,9 +1874,9 @@ TEST(SM50_device_minimum_plus_ssrgemm_nn_t, 64x128x8_16x32x1_4x4_4x8_4x4) { using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1910,9 +1910,9 @@ TEST(SM50_device_minimum_plus_ssrgemm_nn_t, 64x256x8_16x64x1_4x8_4x8_4x4) { using WarpShape = cutlass::gemm::GemmShape<16, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1946,9 +1946,9 @@ 
TEST(SM50_device_minimum_plus_ssrgemm_nn_t, 128x32x16_32x8x1_4x2_8x4_4x4) { using WarpShape = cutlass::gemm::GemmShape<32, 8, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1982,9 +1982,9 @@ TEST(SM50_device_minimum_plus_ssrgemm_nn_t, 128x64x8_32x16x1_4x4_8x4_4x4) { using WarpShape = cutlass::gemm::GemmShape<32, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -2018,9 +2018,9 @@ TEST(SM50_device_minimum_plus_ssrgemm_nn_t, 128x128x8_32x32x1_8x4_4x8_4x4) { using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -2054,9 +2054,9 @@ TEST(SM50_device_minimum_plus_ssrgemm_nn_t, 256x64x8_64x16x1_8x4_8x4_4x4) { using 
WarpShape = cutlass::gemm::GemmShape<64, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; diff --git a/test/device/sm50_simt_minimum_plus_ssrgemm_nt_n.cu b/test/device/sm50_simt_minimum_plus_ssrgemm_nt_n.cu index cc265b1..caa11f4 100644 --- a/test/device/sm50_simt_minimum_plus_ssrgemm_nt_n.cu +++ b/test/device/sm50_simt_minimum_plus_ssrgemm_nt_n.cu @@ -38,9 +38,9 @@ TEST(SM50_device_minimum_plus_ssrgemm_nt_n, 8x32x8_8x32x1_2x4_4x8_1x1) { using WarpShape = cutlass::gemm::GemmShape<8, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -74,9 +74,9 @@ TEST(SM50_device_minimum_plus_ssrgemm_nt_n, 16x32x8_16x32x1_4x4_4x8_1x1) { using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = 
Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -110,9 +110,9 @@ TEST(SM50_device_minimum_plus_ssrgemm_nt_n, 16x64x8_16x64x1_4x8_4x8_1x1) { using WarpShape = cutlass::gemm::GemmShape<16, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -146,9 +146,9 @@ TEST(SM50_device_minimum_plus_ssrgemm_nt_n, 32x32x8_32x32x1_8x4_4x8_1x1) { using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -182,9 +182,9 @@ TEST(SM50_device_minimum_plus_ssrgemm_nt_n, 32x64x8_32x64x1_8x8_4x8_1x1) { using WarpShape = cutlass::gemm::GemmShape<32, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -218,9 +218,9 @@ 
TEST(SM50_device_minimum_plus_ssrgemm_nt_n, 64x32x8_64x32x1_8x8_8x4_1x1) { using WarpShape = cutlass::gemm::GemmShape<64, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -254,9 +254,9 @@ TEST(SM50_device_minimum_plus_ssrgemm_nt_n, 8x32x8_8x16x1_2x2_4x8_1x2) { using WarpShape = cutlass::gemm::GemmShape<8, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -290,9 +290,9 @@ TEST(SM50_device_minimum_plus_ssrgemm_nt_n, 8x64x8_8x32x1_2x4_4x8_1x2) { using WarpShape = cutlass::gemm::GemmShape<8, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -326,9 +326,9 @@ TEST(SM50_device_minimum_plus_ssrgemm_nt_n, 16x32x8_16x16x1_4x2_4x8_1x2) { using WarpShape = 
cutlass::gemm::GemmShape<16, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -362,9 +362,9 @@ TEST(SM50_device_minimum_plus_ssrgemm_nt_n, 16x64x8_16x32x1_4x4_4x8_1x2) { using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -398,9 +398,9 @@ TEST(SM50_device_minimum_plus_ssrgemm_nt_n, 16x128x8_16x64x1_4x8_4x8_1x2) { using WarpShape = cutlass::gemm::GemmShape<16, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -434,9 +434,9 @@ TEST(SM50_device_minimum_plus_ssrgemm_nt_n, 32x32x8_32x16x1_4x4_8x4_1x2) { using WarpShape = cutlass::gemm::GemmShape<32, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 
1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -470,9 +470,9 @@ TEST(SM50_device_minimum_plus_ssrgemm_nt_n, 32x64x8_32x32x1_8x4_4x8_1x2) { using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -506,9 +506,9 @@ TEST(SM50_device_minimum_plus_ssrgemm_nt_n, 32x128x8_32x64x1_8x8_4x8_1x2) { using WarpShape = cutlass::gemm::GemmShape<32, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -542,9 +542,9 @@ TEST(SM50_device_minimum_plus_ssrgemm_nt_n, 64x64x8_64x32x1_8x8_8x4_1x2) { using WarpShape = cutlass::gemm::GemmShape<64, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - 
precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -578,9 +578,9 @@ TEST(SM50_device_minimum_plus_ssrgemm_nt_n, 32x32x8_16x32x1_4x4_4x8_2x1) { using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -614,9 +614,9 @@ TEST(SM50_device_minimum_plus_ssrgemm_nt_n, 64x32x8_32x32x1_8x4_4x8_2x1) { using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -650,9 +650,9 @@ TEST(SM50_device_minimum_plus_ssrgemm_nt_n, 64x64x8_32x64x1_8x8_4x8_2x1) { using WarpShape = cutlass::gemm::GemmShape<32, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, 
SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -686,9 +686,9 @@ TEST(SM50_device_minimum_plus_ssrgemm_nt_n, 128x32x8_64x32x1_8x8_8x4_2x1) { using WarpShape = cutlass::gemm::GemmShape<64, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -722,9 +722,9 @@ TEST(SM50_device_minimum_plus_ssrgemm_nt_n, 16x32x8_8x16x1_2x2_4x8_2x2) { using WarpShape = cutlass::gemm::GemmShape<8, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -758,9 +758,9 @@ TEST(SM50_device_minimum_plus_ssrgemm_nt_n, 16x64x8_8x32x1_2x4_4x8_2x2) { using WarpShape = cutlass::gemm::GemmShape<8, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + 
precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -794,9 +794,9 @@ TEST(SM50_device_minimum_plus_ssrgemm_nt_n, 32x32x8_16x16x1_4x2_4x8_2x2) { using WarpShape = cutlass::gemm::GemmShape<16, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -830,9 +830,9 @@ TEST(SM50_device_minimum_plus_ssrgemm_nt_n, 32x64x8_16x32x1_4x4_4x8_2x2) { using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -866,9 +866,9 @@ TEST(SM50_device_minimum_plus_ssrgemm_nt_n, 32x128x8_16x64x1_4x8_4x8_2x2) { using WarpShape = cutlass::gemm::GemmShape<16, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; 
using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -902,9 +902,9 @@ TEST(SM50_device_minimum_plus_ssrgemm_nt_n, 64x32x8_32x16x1_4x4_8x4_2x2) { using WarpShape = cutlass::gemm::GemmShape<32, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -938,9 +938,9 @@ TEST(SM50_device_minimum_plus_ssrgemm_nt_n, 64x64x8_32x32x1_8x4_4x8_2x2) { using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -974,9 +974,9 @@ TEST(SM50_device_minimum_plus_ssrgemm_nt_n, 64x128x8_32x64x1_8x8_4x8_2x2) { using WarpShape = cutlass::gemm::GemmShape<32, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1010,9 +1010,9 
@@ TEST(SM50_device_minimum_plus_ssrgemm_nt_n, 128x32x8_64x16x1_8x4_8x4_2x2) { using WarpShape = cutlass::gemm::GemmShape<64, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1046,9 +1046,9 @@ TEST(SM50_device_minimum_plus_ssrgemm_nt_n, 128x64x8_64x32x1_8x8_8x4_2x2) { using WarpShape = cutlass::gemm::GemmShape<64, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1082,9 +1082,9 @@ TEST(SM50_device_minimum_plus_ssrgemm_nt_n, 16x64x16_8x16x1_2x2_4x8_2x4) { using WarpShape = cutlass::gemm::GemmShape<8, 16, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1118,9 +1118,9 @@ TEST(SM50_device_minimum_plus_ssrgemm_nt_n, 16x128x16_8x32x1_2x4_4x8_2x4) { using 
WarpShape = cutlass::gemm::GemmShape<8, 32, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1154,9 +1154,9 @@ TEST(SM50_device_minimum_plus_ssrgemm_nt_n, 32x32x8_16x8x1_2x2_8x4_2x4) { using WarpShape = cutlass::gemm::GemmShape<16, 8, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1190,9 +1190,9 @@ TEST(SM50_device_minimum_plus_ssrgemm_nt_n, 32x64x8_16x16x1_4x2_4x8_2x4) { using WarpShape = cutlass::gemm::GemmShape<16, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1226,9 +1226,9 @@ TEST(SM50_device_minimum_plus_ssrgemm_nt_n, 32x128x8_16x32x1_4x4_4x8_2x4) { using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = 
cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1262,9 +1262,9 @@ TEST(SM50_device_minimum_plus_ssrgemm_nt_n, 32x256x8_16x64x1_4x8_4x8_2x4) { using WarpShape = cutlass::gemm::GemmShape<16, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1298,9 +1298,9 @@ TEST(SM50_device_minimum_plus_ssrgemm_nt_n, 64x64x8_32x16x1_4x4_8x4_2x4) { using WarpShape = cutlass::gemm::GemmShape<32, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1334,9 +1334,9 @@ TEST(SM50_device_minimum_plus_ssrgemm_nt_n, 64x128x8_32x32x1_8x4_4x8_2x4) { using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename 
cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1370,9 +1370,9 @@ TEST(SM50_device_minimum_plus_ssrgemm_nt_n, 64x256x8_32x64x1_8x8_4x8_2x4) { using WarpShape = cutlass::gemm::GemmShape<32, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1406,9 +1406,9 @@ TEST(SM50_device_minimum_plus_ssrgemm_nt_n, 128x128x8_64x32x1_8x8_8x4_2x4) { using WarpShape = cutlass::gemm::GemmShape<64, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1442,9 +1442,9 @@ TEST(SM50_device_minimum_plus_ssrgemm_nt_n, 32x32x8_8x16x1_2x2_4x8_4x2) { using WarpShape = cutlass::gemm::GemmShape<8, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, 
precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1478,9 +1478,9 @@ TEST(SM50_device_minimum_plus_ssrgemm_nt_n, 64x32x8_16x16x1_4x2_4x8_4x2) { using WarpShape = cutlass::gemm::GemmShape<16, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1514,9 +1514,9 @@ TEST(SM50_device_minimum_plus_ssrgemm_nt_n, 64x64x8_16x32x1_4x4_4x8_4x2) { using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1550,9 +1550,9 @@ TEST(SM50_device_minimum_plus_ssrgemm_nt_n, 128x32x8_32x16x1_4x4_8x4_4x2) { using WarpShape = cutlass::gemm::GemmShape<32, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using 
Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1586,9 +1586,9 @@ TEST(SM50_device_minimum_plus_ssrgemm_nt_n, 128x64x8_32x32x1_8x4_4x8_4x2) { using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1622,9 +1622,9 @@ TEST(SM50_device_minimum_plus_ssrgemm_nt_n, 128x128x8_32x64x1_8x8_4x8_4x2) { using WarpShape = cutlass::gemm::GemmShape<32, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1658,9 +1658,9 @@ TEST(SM50_device_minimum_plus_ssrgemm_nt_n, 256x32x8_64x16x1_8x4_8x4_4x2) { using WarpShape = cutlass::gemm::GemmShape<64, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, 
precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1694,9 +1694,9 @@ TEST(SM50_device_minimum_plus_ssrgemm_nt_n, 256x64x8_64x32x1_8x8_8x4_4x2) { using WarpShape = cutlass::gemm::GemmShape<64, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1730,9 +1730,9 @@ TEST(SM50_device_minimum_plus_ssrgemm_nt_n, 32x64x16_8x16x1_2x2_4x8_4x4) { using WarpShape = cutlass::gemm::GemmShape<8, 16, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1766,9 +1766,9 @@ TEST(SM50_device_minimum_plus_ssrgemm_nt_n, 32x128x16_8x32x1_2x4_4x8_4x4) { using WarpShape = cutlass::gemm::GemmShape<8, 32, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; 
using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1802,9 +1802,9 @@ TEST(SM50_device_minimum_plus_ssrgemm_nt_n, 64x32x16_16x8x1_2x2_8x4_4x4) { using WarpShape = cutlass::gemm::GemmShape<16, 8, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1838,9 +1838,9 @@ TEST(SM50_device_minimum_plus_ssrgemm_nt_n, 64x64x8_16x16x1_4x2_4x8_4x4) { using WarpShape = cutlass::gemm::GemmShape<16, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1874,9 +1874,9 @@ TEST(SM50_device_minimum_plus_ssrgemm_nt_n, 64x128x8_16x32x1_4x4_4x8_4x4) { using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1910,9 
+1910,9 @@ TEST(SM50_device_minimum_plus_ssrgemm_nt_n, 64x256x8_16x64x1_4x8_4x8_4x4) { using WarpShape = cutlass::gemm::GemmShape<16, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1946,9 +1946,9 @@ TEST(SM50_device_minimum_plus_ssrgemm_nt_n, 128x32x16_32x8x1_4x2_8x4_4x4) { using WarpShape = cutlass::gemm::GemmShape<32, 8, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1982,9 +1982,9 @@ TEST(SM50_device_minimum_plus_ssrgemm_nt_n, 128x64x8_32x16x1_4x4_8x4_4x4) { using WarpShape = cutlass::gemm::GemmShape<32, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -2018,9 +2018,9 @@ TEST(SM50_device_minimum_plus_ssrgemm_nt_n, 128x128x8_32x32x1_8x4_4x8_4x4) 
{ using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -2054,9 +2054,9 @@ TEST(SM50_device_minimum_plus_ssrgemm_nt_n, 256x64x8_64x16x1_8x4_8x4_4x4) { using WarpShape = cutlass::gemm::GemmShape<64, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; diff --git a/test/device/sm50_simt_minimum_plus_ssrgemm_nt_t.cu b/test/device/sm50_simt_minimum_plus_ssrgemm_nt_t.cu index f470b8b..21e326d 100644 --- a/test/device/sm50_simt_minimum_plus_ssrgemm_nt_t.cu +++ b/test/device/sm50_simt_minimum_plus_ssrgemm_nt_t.cu @@ -38,9 +38,9 @@ TEST(SM50_device_minimum_plus_ssrgemm_nt_t, 8x32x8_8x32x1_2x4_4x8_1x1) { using WarpShape = cutlass::gemm::GemmShape<8, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; 
using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -74,9 +74,9 @@ TEST(SM50_device_minimum_plus_ssrgemm_nt_t, 16x32x8_16x32x1_4x4_4x8_1x1) { using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -110,9 +110,9 @@ TEST(SM50_device_minimum_plus_ssrgemm_nt_t, 16x64x8_16x64x1_4x8_4x8_1x1) { using WarpShape = cutlass::gemm::GemmShape<16, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -146,9 +146,9 @@ TEST(SM50_device_minimum_plus_ssrgemm_nt_t, 32x32x8_32x32x1_8x4_4x8_1x1) { using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -182,9 +182,9 @@ 
TEST(SM50_device_minimum_plus_ssrgemm_nt_t, 32x64x8_32x64x1_8x8_4x8_1x1) { using WarpShape = cutlass::gemm::GemmShape<32, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -218,9 +218,9 @@ TEST(SM50_device_minimum_plus_ssrgemm_nt_t, 64x32x8_64x32x1_8x8_8x4_1x1) { using WarpShape = cutlass::gemm::GemmShape<64, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -254,9 +254,9 @@ TEST(SM50_device_minimum_plus_ssrgemm_nt_t, 8x32x8_8x16x1_2x2_4x8_1x2) { using WarpShape = cutlass::gemm::GemmShape<8, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -290,9 +290,9 @@ TEST(SM50_device_minimum_plus_ssrgemm_nt_t, 8x64x8_8x32x1_2x4_4x8_1x2) { using WarpShape = 
cutlass::gemm::GemmShape<8, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -326,9 +326,9 @@ TEST(SM50_device_minimum_plus_ssrgemm_nt_t, 16x32x8_16x16x1_4x2_4x8_1x2) { using WarpShape = cutlass::gemm::GemmShape<16, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -362,9 +362,9 @@ TEST(SM50_device_minimum_plus_ssrgemm_nt_t, 16x64x8_16x32x1_4x4_4x8_1x2) { using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -398,9 +398,9 @@ TEST(SM50_device_minimum_plus_ssrgemm_nt_t, 16x128x8_16x64x1_4x8_4x8_1x2) { using WarpShape = cutlass::gemm::GemmShape<16, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 
1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -434,9 +434,9 @@ TEST(SM50_device_minimum_plus_ssrgemm_nt_t, 32x32x8_32x16x1_4x4_8x4_1x2) { using WarpShape = cutlass::gemm::GemmShape<32, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -470,9 +470,9 @@ TEST(SM50_device_minimum_plus_ssrgemm_nt_t, 32x64x8_32x32x1_8x4_4x8_1x2) { using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -506,9 +506,9 @@ TEST(SM50_device_minimum_plus_ssrgemm_nt_t, 32x128x8_32x64x1_8x8_4x8_1x2) { using WarpShape = cutlass::gemm::GemmShape<32, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - 
precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -542,9 +542,9 @@ TEST(SM50_device_minimum_plus_ssrgemm_nt_t, 64x64x8_64x32x1_8x8_8x4_1x2) { using WarpShape = cutlass::gemm::GemmShape<64, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -578,9 +578,9 @@ TEST(SM50_device_minimum_plus_ssrgemm_nt_t, 32x32x8_16x32x1_4x4_4x8_2x1) { using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -614,9 +614,9 @@ TEST(SM50_device_minimum_plus_ssrgemm_nt_t, 64x32x8_32x32x1_8x4_4x8_2x1) { using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, 
SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -650,9 +650,9 @@ TEST(SM50_device_minimum_plus_ssrgemm_nt_t, 64x64x8_32x64x1_8x8_4x8_2x1) { using WarpShape = cutlass::gemm::GemmShape<32, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -686,9 +686,9 @@ TEST(SM50_device_minimum_plus_ssrgemm_nt_t, 128x32x8_64x32x1_8x8_8x4_2x1) { using WarpShape = cutlass::gemm::GemmShape<64, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -722,9 +722,9 @@ TEST(SM50_device_minimum_plus_ssrgemm_nt_t, 16x32x8_8x16x1_2x2_4x8_2x2) { using WarpShape = cutlass::gemm::GemmShape<8, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + 
precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -758,9 +758,9 @@ TEST(SM50_device_minimum_plus_ssrgemm_nt_t, 16x64x8_8x32x1_2x4_4x8_2x2) { using WarpShape = cutlass::gemm::GemmShape<8, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -794,9 +794,9 @@ TEST(SM50_device_minimum_plus_ssrgemm_nt_t, 32x32x8_16x16x1_4x2_4x8_2x2) { using WarpShape = cutlass::gemm::GemmShape<16, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -830,9 +830,9 @@ TEST(SM50_device_minimum_plus_ssrgemm_nt_t, 32x64x8_16x32x1_4x4_4x8_2x2) { using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; 
using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -866,9 +866,9 @@ TEST(SM50_device_minimum_plus_ssrgemm_nt_t, 32x128x8_16x64x1_4x8_4x8_2x2) { using WarpShape = cutlass::gemm::GemmShape<16, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -902,9 +902,9 @@ TEST(SM50_device_minimum_plus_ssrgemm_nt_t, 64x32x8_32x16x1_4x4_8x4_2x2) { using WarpShape = cutlass::gemm::GemmShape<32, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -938,9 +938,9 @@ TEST(SM50_device_minimum_plus_ssrgemm_nt_t, 64x64x8_32x32x1_8x4_4x8_2x2) { using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -974,9 +974,9 
@@ TEST(SM50_device_minimum_plus_ssrgemm_nt_t, 64x128x8_32x64x1_8x8_4x8_2x2) { using WarpShape = cutlass::gemm::GemmShape<32, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1010,9 +1010,9 @@ TEST(SM50_device_minimum_plus_ssrgemm_nt_t, 128x32x8_64x16x1_8x4_8x4_2x2) { using WarpShape = cutlass::gemm::GemmShape<64, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1046,9 +1046,9 @@ TEST(SM50_device_minimum_plus_ssrgemm_nt_t, 128x64x8_64x32x1_8x8_8x4_2x2) { using WarpShape = cutlass::gemm::GemmShape<64, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1082,9 +1082,9 @@ TEST(SM50_device_minimum_plus_ssrgemm_nt_t, 16x64x16_8x16x1_2x2_4x8_2x4) { using 
WarpShape = cutlass::gemm::GemmShape<8, 16, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1118,9 +1118,9 @@ TEST(SM50_device_minimum_plus_ssrgemm_nt_t, 16x128x16_8x32x1_2x4_4x8_2x4) { using WarpShape = cutlass::gemm::GemmShape<8, 32, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1154,9 +1154,9 @@ TEST(SM50_device_minimum_plus_ssrgemm_nt_t, 32x32x8_16x8x1_2x2_8x4_2x4) { using WarpShape = cutlass::gemm::GemmShape<16, 8, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1190,9 +1190,9 @@ TEST(SM50_device_minimum_plus_ssrgemm_nt_t, 32x64x8_16x16x1_4x2_4x8_2x4) { using WarpShape = cutlass::gemm::GemmShape<16, 16, 8>; using InstructionShape = 
cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1226,9 +1226,9 @@ TEST(SM50_device_minimum_plus_ssrgemm_nt_t, 32x128x8_16x32x1_4x4_4x8_2x4) { using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1262,9 +1262,9 @@ TEST(SM50_device_minimum_plus_ssrgemm_nt_t, 32x256x8_16x64x1_4x8_4x8_2x4) { using WarpShape = cutlass::gemm::GemmShape<16, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1298,9 +1298,9 @@ TEST(SM50_device_minimum_plus_ssrgemm_nt_t, 64x64x8_32x16x1_4x4_8x4_2x4) { using WarpShape = cutlass::gemm::GemmShape<32, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename 
cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1334,9 +1334,9 @@ TEST(SM50_device_minimum_plus_ssrgemm_nt_t, 64x128x8_32x32x1_8x4_4x8_2x4) { using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1370,9 +1370,9 @@ TEST(SM50_device_minimum_plus_ssrgemm_nt_t, 64x256x8_32x64x1_8x8_4x8_2x4) { using WarpShape = cutlass::gemm::GemmShape<32, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1406,9 +1406,9 @@ TEST(SM50_device_minimum_plus_ssrgemm_nt_t, 128x128x8_64x32x1_8x8_8x4_2x4) { using WarpShape = cutlass::gemm::GemmShape<64, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, 
precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1442,9 +1442,9 @@ TEST(SM50_device_minimum_plus_ssrgemm_nt_t, 32x32x8_8x16x1_2x2_4x8_4x2) { using WarpShape = cutlass::gemm::GemmShape<8, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1478,9 +1478,9 @@ TEST(SM50_device_minimum_plus_ssrgemm_nt_t, 64x32x8_16x16x1_4x2_4x8_4x2) { using WarpShape = cutlass::gemm::GemmShape<16, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1514,9 +1514,9 @@ TEST(SM50_device_minimum_plus_ssrgemm_nt_t, 64x64x8_16x32x1_4x4_4x8_4x2) { using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = 
typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1550,9 +1550,9 @@ TEST(SM50_device_minimum_plus_ssrgemm_nt_t, 128x32x8_32x16x1_4x4_8x4_4x2) { using WarpShape = cutlass::gemm::GemmShape<32, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1586,9 +1586,9 @@ TEST(SM50_device_minimum_plus_ssrgemm_nt_t, 128x64x8_32x32x1_8x4_4x8_4x2) { using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1622,9 +1622,9 @@ TEST(SM50_device_minimum_plus_ssrgemm_nt_t, 128x128x8_32x64x1_8x8_4x8_4x2) { using WarpShape = cutlass::gemm::GemmShape<32, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, 
precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1658,9 +1658,9 @@ TEST(SM50_device_minimum_plus_ssrgemm_nt_t, 256x32x8_64x16x1_8x4_8x4_4x2) { using WarpShape = cutlass::gemm::GemmShape<64, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1694,9 +1694,9 @@ TEST(SM50_device_minimum_plus_ssrgemm_nt_t, 256x64x8_64x32x1_8x8_8x4_4x2) { using WarpShape = cutlass::gemm::GemmShape<64, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1730,9 +1730,9 @@ TEST(SM50_device_minimum_plus_ssrgemm_nt_t, 32x64x16_8x16x1_2x2_4x8_4x4) { using WarpShape = cutlass::gemm::GemmShape<8, 16, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = 
Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1766,9 +1766,9 @@ TEST(SM50_device_minimum_plus_ssrgemm_nt_t, 32x128x16_8x32x1_2x4_4x8_4x4) { using WarpShape = cutlass::gemm::GemmShape<8, 32, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1802,9 +1802,9 @@ TEST(SM50_device_minimum_plus_ssrgemm_nt_t, 64x32x16_16x8x1_2x2_8x4_4x4) { using WarpShape = cutlass::gemm::GemmShape<16, 8, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1838,9 +1838,9 @@ TEST(SM50_device_minimum_plus_ssrgemm_nt_t, 64x64x8_16x16x1_4x2_4x8_4x4) { using WarpShape = cutlass::gemm::GemmShape<16, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1874,9 +1874,9 @@ 
TEST(SM50_device_minimum_plus_ssrgemm_nt_t, 64x128x8_16x32x1_4x4_4x8_4x4) { using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1910,9 +1910,9 @@ TEST(SM50_device_minimum_plus_ssrgemm_nt_t, 64x256x8_16x64x1_4x8_4x8_4x4) { using WarpShape = cutlass::gemm::GemmShape<16, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1946,9 +1946,9 @@ TEST(SM50_device_minimum_plus_ssrgemm_nt_t, 128x32x16_32x8x1_4x2_8x4_4x4) { using WarpShape = cutlass::gemm::GemmShape<32, 8, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1982,9 +1982,9 @@ TEST(SM50_device_minimum_plus_ssrgemm_nt_t, 128x64x8_32x16x1_4x4_8x4_4x4) { using 
WarpShape = cutlass::gemm::GemmShape<32, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -2018,9 +2018,9 @@ TEST(SM50_device_minimum_plus_ssrgemm_nt_t, 128x128x8_32x32x1_8x4_4x8_4x4) { using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -2054,9 +2054,9 @@ TEST(SM50_device_minimum_plus_ssrgemm_nt_t, 256x64x8_64x16x1_8x4_8x4_4x4) { using WarpShape = cutlass::gemm::GemmShape<64, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; diff --git a/test/device/sm50_simt_minimum_plus_ssrgemm_tn_n.cu b/test/device/sm50_simt_minimum_plus_ssrgemm_tn_n.cu index 9d2dd21..bfafaf4 100644 --- 
a/test/device/sm50_simt_minimum_plus_ssrgemm_tn_n.cu +++ b/test/device/sm50_simt_minimum_plus_ssrgemm_tn_n.cu @@ -38,9 +38,9 @@ TEST(SM50_device_minimum_plus_ssrgemm_tn_n, 8x32x8_8x32x1_2x4_4x8_1x1) { using WarpShape = cutlass::gemm::GemmShape<8, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -74,9 +74,9 @@ TEST(SM50_device_minimum_plus_ssrgemm_tn_n, 16x32x8_16x32x1_4x4_4x8_1x1) { using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -110,9 +110,9 @@ TEST(SM50_device_minimum_plus_ssrgemm_tn_n, 16x64x8_16x64x1_4x8_4x8_1x1) { using WarpShape = cutlass::gemm::GemmShape<16, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = 
Config::MultiplicationOp; @@ -146,9 +146,9 @@ TEST(SM50_device_minimum_plus_ssrgemm_tn_n, 32x32x8_32x32x1_8x4_4x8_1x1) { using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -182,9 +182,9 @@ TEST(SM50_device_minimum_plus_ssrgemm_tn_n, 32x64x8_32x64x1_8x8_4x8_1x1) { using WarpShape = cutlass::gemm::GemmShape<32, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -218,9 +218,9 @@ TEST(SM50_device_minimum_plus_ssrgemm_tn_n, 64x32x8_64x32x1_8x8_8x4_1x1) { using WarpShape = cutlass::gemm::GemmShape<64, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -254,9 +254,9 @@ TEST(SM50_device_minimum_plus_ssrgemm_tn_n, 
8x32x8_8x16x1_2x2_4x8_1x2) { using WarpShape = cutlass::gemm::GemmShape<8, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -290,9 +290,9 @@ TEST(SM50_device_minimum_plus_ssrgemm_tn_n, 8x64x8_8x32x1_2x4_4x8_1x2) { using WarpShape = cutlass::gemm::GemmShape<8, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -326,9 +326,9 @@ TEST(SM50_device_minimum_plus_ssrgemm_tn_n, 16x32x8_16x16x1_4x2_4x8_1x2) { using WarpShape = cutlass::gemm::GemmShape<16, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -362,9 +362,9 @@ TEST(SM50_device_minimum_plus_ssrgemm_tn_n, 16x64x8_16x32x1_4x4_4x8_1x2) { using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using 
InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -398,9 +398,9 @@ TEST(SM50_device_minimum_plus_ssrgemm_tn_n, 16x128x8_16x64x1_4x8_4x8_1x2) { using WarpShape = cutlass::gemm::GemmShape<16, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -434,9 +434,9 @@ TEST(SM50_device_minimum_plus_ssrgemm_tn_n, 32x32x8_32x16x1_4x4_8x4_1x2) { using WarpShape = cutlass::gemm::GemmShape<32, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -470,9 +470,9 @@ TEST(SM50_device_minimum_plus_ssrgemm_tn_n, 32x64x8_32x32x1_8x4_4x8_1x2) { using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename 
cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -506,9 +506,9 @@ TEST(SM50_device_minimum_plus_ssrgemm_tn_n, 32x128x8_32x64x1_8x8_4x8_1x2) { using WarpShape = cutlass::gemm::GemmShape<32, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -542,9 +542,9 @@ TEST(SM50_device_minimum_plus_ssrgemm_tn_n, 64x64x8_64x32x1_8x8_8x4_1x2) { using WarpShape = cutlass::gemm::GemmShape<64, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -578,9 +578,9 @@ TEST(SM50_device_minimum_plus_ssrgemm_tn_n, 32x32x8_16x32x1_4x4_4x8_2x1) { using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, 
precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -614,9 +614,9 @@ TEST(SM50_device_minimum_plus_ssrgemm_tn_n, 64x32x8_32x32x1_8x4_4x8_2x1) { using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -650,9 +650,9 @@ TEST(SM50_device_minimum_plus_ssrgemm_tn_n, 64x64x8_32x64x1_8x8_4x8_2x1) { using WarpShape = cutlass::gemm::GemmShape<32, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -686,9 +686,9 @@ TEST(SM50_device_minimum_plus_ssrgemm_tn_n, 128x32x8_64x32x1_8x8_8x4_2x1) { using WarpShape = cutlass::gemm::GemmShape<64, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename 
cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -722,9 +722,9 @@ TEST(SM50_device_minimum_plus_ssrgemm_tn_n, 16x32x8_8x16x1_2x2_4x8_2x2) { using WarpShape = cutlass::gemm::GemmShape<8, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -758,9 +758,9 @@ TEST(SM50_device_minimum_plus_ssrgemm_tn_n, 16x64x8_8x32x1_2x4_4x8_2x2) { using WarpShape = cutlass::gemm::GemmShape<8, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -794,9 +794,9 @@ TEST(SM50_device_minimum_plus_ssrgemm_tn_n, 32x32x8_16x16x1_4x2_4x8_2x2) { using WarpShape = cutlass::gemm::GemmShape<16, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + 
cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -830,9 +830,9 @@ TEST(SM50_device_minimum_plus_ssrgemm_tn_n, 32x64x8_16x32x1_4x4_4x8_2x2) { using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -866,9 +866,9 @@ TEST(SM50_device_minimum_plus_ssrgemm_tn_n, 32x128x8_16x64x1_4x8_4x8_2x2) { using WarpShape = cutlass::gemm::GemmShape<16, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -902,9 +902,9 @@ TEST(SM50_device_minimum_plus_ssrgemm_tn_n, 64x32x8_32x16x1_4x4_8x4_2x2) { using WarpShape = cutlass::gemm::GemmShape<32, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp 
= Config::MultiplicationOp; @@ -938,9 +938,9 @@ TEST(SM50_device_minimum_plus_ssrgemm_tn_n, 64x64x8_32x32x1_8x4_4x8_2x2) { using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -974,9 +974,9 @@ TEST(SM50_device_minimum_plus_ssrgemm_tn_n, 64x128x8_32x64x1_8x8_4x8_2x2) { using WarpShape = cutlass::gemm::GemmShape<32, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1010,9 +1010,9 @@ TEST(SM50_device_minimum_plus_ssrgemm_tn_n, 128x32x8_64x16x1_8x4_8x4_2x2) { using WarpShape = cutlass::gemm::GemmShape<64, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1046,9 +1046,9 @@ 
TEST(SM50_device_minimum_plus_ssrgemm_tn_n, 128x64x8_64x32x1_8x8_8x4_2x2) { using WarpShape = cutlass::gemm::GemmShape<64, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1082,9 +1082,9 @@ TEST(SM50_device_minimum_plus_ssrgemm_tn_n, 16x64x16_8x16x1_2x2_4x8_2x4) { using WarpShape = cutlass::gemm::GemmShape<8, 16, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1118,9 +1118,9 @@ TEST(SM50_device_minimum_plus_ssrgemm_tn_n, 16x128x16_8x32x1_2x4_4x8_2x4) { using WarpShape = cutlass::gemm::GemmShape<8, 32, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1154,9 +1154,9 @@ TEST(SM50_device_minimum_plus_ssrgemm_tn_n, 32x32x8_16x8x1_2x2_8x4_2x4) { using 
WarpShape = cutlass::gemm::GemmShape<16, 8, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1190,9 +1190,9 @@ TEST(SM50_device_minimum_plus_ssrgemm_tn_n, 32x64x8_16x16x1_4x2_4x8_2x4) { using WarpShape = cutlass::gemm::GemmShape<16, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1226,9 +1226,9 @@ TEST(SM50_device_minimum_plus_ssrgemm_tn_n, 32x128x8_16x32x1_4x4_4x8_2x4) { using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1262,9 +1262,9 @@ TEST(SM50_device_minimum_plus_ssrgemm_tn_n, 32x256x8_16x64x1_4x8_4x8_2x4) { using WarpShape = cutlass::gemm::GemmShape<16, 64, 8>; using InstructionShape = 
cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1298,9 +1298,9 @@ TEST(SM50_device_minimum_plus_ssrgemm_tn_n, 64x64x8_32x16x1_4x4_8x4_2x4) { using WarpShape = cutlass::gemm::GemmShape<32, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1334,9 +1334,9 @@ TEST(SM50_device_minimum_plus_ssrgemm_tn_n, 64x128x8_32x32x1_8x4_4x8_2x4) { using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1370,9 +1370,9 @@ TEST(SM50_device_minimum_plus_ssrgemm_tn_n, 64x256x8_32x64x1_8x8_4x8_2x4) { using WarpShape = cutlass::gemm::GemmShape<32, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename 
cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1406,9 +1406,9 @@ TEST(SM50_device_minimum_plus_ssrgemm_tn_n, 128x128x8_64x32x1_8x8_8x4_2x4) { using WarpShape = cutlass::gemm::GemmShape<64, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1442,9 +1442,9 @@ TEST(SM50_device_minimum_plus_ssrgemm_tn_n, 32x32x8_8x16x1_2x2_4x8_4x2) { using WarpShape = cutlass::gemm::GemmShape<8, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1478,9 +1478,9 @@ TEST(SM50_device_minimum_plus_ssrgemm_tn_n, 64x32x8_16x16x1_4x2_4x8_4x2) { using WarpShape = cutlass::gemm::GemmShape<16, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, 
precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1514,9 +1514,9 @@ TEST(SM50_device_minimum_plus_ssrgemm_tn_n, 64x64x8_16x32x1_4x4_4x8_4x2) { using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1550,9 +1550,9 @@ TEST(SM50_device_minimum_plus_ssrgemm_tn_n, 128x32x8_32x16x1_4x4_8x4_4x2) { using WarpShape = cutlass::gemm::GemmShape<32, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1586,9 +1586,9 @@ TEST(SM50_device_minimum_plus_ssrgemm_tn_n, 128x64x8_32x32x1_8x4_4x8_4x2) { using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = 
typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1622,9 +1622,9 @@ TEST(SM50_device_minimum_plus_ssrgemm_tn_n, 128x128x8_32x64x1_8x8_4x8_4x2) { using WarpShape = cutlass::gemm::GemmShape<32, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1658,9 +1658,9 @@ TEST(SM50_device_minimum_plus_ssrgemm_tn_n, 256x32x8_64x16x1_8x4_8x4_4x2) { using WarpShape = cutlass::gemm::GemmShape<64, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1694,9 +1694,9 @@ TEST(SM50_device_minimum_plus_ssrgemm_tn_n, 256x64x8_64x32x1_8x8_8x4_4x2) { using WarpShape = cutlass::gemm::GemmShape<64, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, 
precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1730,9 +1730,9 @@ TEST(SM50_device_minimum_plus_ssrgemm_tn_n, 32x64x16_8x16x1_2x2_4x8_4x4) { using WarpShape = cutlass::gemm::GemmShape<8, 16, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1766,9 +1766,9 @@ TEST(SM50_device_minimum_plus_ssrgemm_tn_n, 32x128x16_8x32x1_2x4_4x8_4x4) { using WarpShape = cutlass::gemm::GemmShape<8, 32, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1802,9 +1802,9 @@ TEST(SM50_device_minimum_plus_ssrgemm_tn_n, 64x32x16_16x8x1_2x2_8x4_4x4) { using WarpShape = cutlass::gemm::GemmShape<16, 8, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = 
Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1838,9 +1838,9 @@ TEST(SM50_device_minimum_plus_ssrgemm_tn_n, 64x64x8_16x16x1_4x2_4x8_4x4) { using WarpShape = cutlass::gemm::GemmShape<16, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1874,9 +1874,9 @@ TEST(SM50_device_minimum_plus_ssrgemm_tn_n, 64x128x8_16x32x1_4x4_4x8_4x4) { using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1910,9 +1910,9 @@ TEST(SM50_device_minimum_plus_ssrgemm_tn_n, 64x256x8_16x64x1_4x8_4x8_4x4) { using WarpShape = cutlass::gemm::GemmShape<16, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1946,9 +1946,9 @@ 
TEST(SM50_device_minimum_plus_ssrgemm_tn_n, 128x32x16_32x8x1_4x2_8x4_4x4) { using WarpShape = cutlass::gemm::GemmShape<32, 8, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1982,9 +1982,9 @@ TEST(SM50_device_minimum_plus_ssrgemm_tn_n, 128x64x8_32x16x1_4x4_8x4_4x4) { using WarpShape = cutlass::gemm::GemmShape<32, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -2018,9 +2018,9 @@ TEST(SM50_device_minimum_plus_ssrgemm_tn_n, 128x128x8_32x32x1_8x4_4x8_4x4) { using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -2054,9 +2054,9 @@ TEST(SM50_device_minimum_plus_ssrgemm_tn_n, 256x64x8_64x16x1_8x4_8x4_4x4) { using 
WarpShape = cutlass::gemm::GemmShape<64, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; diff --git a/test/device/sm50_simt_minimum_plus_ssrgemm_tn_t.cu b/test/device/sm50_simt_minimum_plus_ssrgemm_tn_t.cu index 8cd9fcf..3c57d4c 100644 --- a/test/device/sm50_simt_minimum_plus_ssrgemm_tn_t.cu +++ b/test/device/sm50_simt_minimum_plus_ssrgemm_tn_t.cu @@ -38,9 +38,9 @@ TEST(SM50_device_minimum_plus_ssrgemm_tn_t, 8x32x8_8x32x1_2x4_4x8_1x1) { using WarpShape = cutlass::gemm::GemmShape<8, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -74,9 +74,9 @@ TEST(SM50_device_minimum_plus_ssrgemm_tn_t, 16x32x8_16x32x1_4x4_4x8_1x1) { using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = 
Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -110,9 +110,9 @@ TEST(SM50_device_minimum_plus_ssrgemm_tn_t, 16x64x8_16x64x1_4x8_4x8_1x1) { using WarpShape = cutlass::gemm::GemmShape<16, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -146,9 +146,9 @@ TEST(SM50_device_minimum_plus_ssrgemm_tn_t, 32x32x8_32x32x1_8x4_4x8_1x1) { using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -182,9 +182,9 @@ TEST(SM50_device_minimum_plus_ssrgemm_tn_t, 32x64x8_32x64x1_8x8_4x8_1x1) { using WarpShape = cutlass::gemm::GemmShape<32, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -218,9 +218,9 @@ 
TEST(SM50_device_minimum_plus_ssrgemm_tn_t, 64x32x8_64x32x1_8x8_8x4_1x1) { using WarpShape = cutlass::gemm::GemmShape<64, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -254,9 +254,9 @@ TEST(SM50_device_minimum_plus_ssrgemm_tn_t, 8x32x8_8x16x1_2x2_4x8_1x2) { using WarpShape = cutlass::gemm::GemmShape<8, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -290,9 +290,9 @@ TEST(SM50_device_minimum_plus_ssrgemm_tn_t, 8x64x8_8x32x1_2x4_4x8_1x2) { using WarpShape = cutlass::gemm::GemmShape<8, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -326,9 +326,9 @@ TEST(SM50_device_minimum_plus_ssrgemm_tn_t, 16x32x8_16x16x1_4x2_4x8_1x2) { using WarpShape = 
cutlass::gemm::GemmShape<16, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -362,9 +362,9 @@ TEST(SM50_device_minimum_plus_ssrgemm_tn_t, 16x64x8_16x32x1_4x4_4x8_1x2) { using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -398,9 +398,9 @@ TEST(SM50_device_minimum_plus_ssrgemm_tn_t, 16x128x8_16x64x1_4x8_4x8_1x2) { using WarpShape = cutlass::gemm::GemmShape<16, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -434,9 +434,9 @@ TEST(SM50_device_minimum_plus_ssrgemm_tn_t, 32x32x8_32x16x1_4x4_8x4_1x2) { using WarpShape = cutlass::gemm::GemmShape<32, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 
1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -470,9 +470,9 @@ TEST(SM50_device_minimum_plus_ssrgemm_tn_t, 32x64x8_32x32x1_8x4_4x8_1x2) { using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -506,9 +506,9 @@ TEST(SM50_device_minimum_plus_ssrgemm_tn_t, 32x128x8_32x64x1_8x8_4x8_1x2) { using WarpShape = cutlass::gemm::GemmShape<32, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -542,9 +542,9 @@ TEST(SM50_device_minimum_plus_ssrgemm_tn_t, 64x64x8_64x32x1_8x8_8x4_1x2) { using WarpShape = cutlass::gemm::GemmShape<64, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - 
precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -578,9 +578,9 @@ TEST(SM50_device_minimum_plus_ssrgemm_tn_t, 32x32x8_16x32x1_4x4_4x8_2x1) { using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -614,9 +614,9 @@ TEST(SM50_device_minimum_plus_ssrgemm_tn_t, 64x32x8_32x32x1_8x4_4x8_2x1) { using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -650,9 +650,9 @@ TEST(SM50_device_minimum_plus_ssrgemm_tn_t, 64x64x8_32x64x1_8x8_4x8_2x1) { using WarpShape = cutlass::gemm::GemmShape<32, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, 
SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -686,9 +686,9 @@ TEST(SM50_device_minimum_plus_ssrgemm_tn_t, 128x32x8_64x32x1_8x8_8x4_2x1) { using WarpShape = cutlass::gemm::GemmShape<64, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -722,9 +722,9 @@ TEST(SM50_device_minimum_plus_ssrgemm_tn_t, 16x32x8_8x16x1_2x2_4x8_2x2) { using WarpShape = cutlass::gemm::GemmShape<8, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -758,9 +758,9 @@ TEST(SM50_device_minimum_plus_ssrgemm_tn_t, 16x64x8_8x32x1_2x4_4x8_2x2) { using WarpShape = cutlass::gemm::GemmShape<8, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + 
precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -794,9 +794,9 @@ TEST(SM50_device_minimum_plus_ssrgemm_tn_t, 32x32x8_16x16x1_4x2_4x8_2x2) { using WarpShape = cutlass::gemm::GemmShape<16, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -830,9 +830,9 @@ TEST(SM50_device_minimum_plus_ssrgemm_tn_t, 32x64x8_16x32x1_4x4_4x8_2x2) { using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -866,9 +866,9 @@ TEST(SM50_device_minimum_plus_ssrgemm_tn_t, 32x128x8_16x64x1_4x8_4x8_2x2) { using WarpShape = cutlass::gemm::GemmShape<16, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; 
using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -902,9 +902,9 @@ TEST(SM50_device_minimum_plus_ssrgemm_tn_t, 64x32x8_32x16x1_4x4_8x4_2x2) { using WarpShape = cutlass::gemm::GemmShape<32, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -938,9 +938,9 @@ TEST(SM50_device_minimum_plus_ssrgemm_tn_t, 64x64x8_32x32x1_8x4_4x8_2x2) { using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -974,9 +974,9 @@ TEST(SM50_device_minimum_plus_ssrgemm_tn_t, 64x128x8_32x64x1_8x8_4x8_2x2) { using WarpShape = cutlass::gemm::GemmShape<32, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1010,9 +1010,9 
@@ TEST(SM50_device_minimum_plus_ssrgemm_tn_t, 128x32x8_64x16x1_8x4_8x4_2x2) { using WarpShape = cutlass::gemm::GemmShape<64, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1046,9 +1046,9 @@ TEST(SM50_device_minimum_plus_ssrgemm_tn_t, 128x64x8_64x32x1_8x8_8x4_2x2) { using WarpShape = cutlass::gemm::GemmShape<64, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1082,9 +1082,9 @@ TEST(SM50_device_minimum_plus_ssrgemm_tn_t, 16x64x16_8x16x1_2x2_4x8_2x4) { using WarpShape = cutlass::gemm::GemmShape<8, 16, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1118,9 +1118,9 @@ TEST(SM50_device_minimum_plus_ssrgemm_tn_t, 16x128x16_8x32x1_2x4_4x8_2x4) { using 
WarpShape = cutlass::gemm::GemmShape<8, 32, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1154,9 +1154,9 @@ TEST(SM50_device_minimum_plus_ssrgemm_tn_t, 32x32x8_16x8x1_2x2_8x4_2x4) { using WarpShape = cutlass::gemm::GemmShape<16, 8, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1190,9 +1190,9 @@ TEST(SM50_device_minimum_plus_ssrgemm_tn_t, 32x64x8_16x16x1_4x2_4x8_2x4) { using WarpShape = cutlass::gemm::GemmShape<16, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1226,9 +1226,9 @@ TEST(SM50_device_minimum_plus_ssrgemm_tn_t, 32x128x8_16x32x1_4x4_4x8_2x4) { using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = 
cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1262,9 +1262,9 @@ TEST(SM50_device_minimum_plus_ssrgemm_tn_t, 32x256x8_16x64x1_4x8_4x8_2x4) { using WarpShape = cutlass::gemm::GemmShape<16, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1298,9 +1298,9 @@ TEST(SM50_device_minimum_plus_ssrgemm_tn_t, 64x64x8_32x16x1_4x4_8x4_2x4) { using WarpShape = cutlass::gemm::GemmShape<32, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1334,9 +1334,9 @@ TEST(SM50_device_minimum_plus_ssrgemm_tn_t, 64x128x8_32x32x1_8x4_4x8_2x4) { using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename 
cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1370,9 +1370,9 @@ TEST(SM50_device_minimum_plus_ssrgemm_tn_t, 64x256x8_32x64x1_8x8_4x8_2x4) { using WarpShape = cutlass::gemm::GemmShape<32, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1406,9 +1406,9 @@ TEST(SM50_device_minimum_plus_ssrgemm_tn_t, 128x128x8_64x32x1_8x8_8x4_2x4) { using WarpShape = cutlass::gemm::GemmShape<64, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1442,9 +1442,9 @@ TEST(SM50_device_minimum_plus_ssrgemm_tn_t, 32x32x8_8x16x1_2x2_4x8_4x2) { using WarpShape = cutlass::gemm::GemmShape<8, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, 
precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1478,9 +1478,9 @@ TEST(SM50_device_minimum_plus_ssrgemm_tn_t, 64x32x8_16x16x1_4x2_4x8_4x2) { using WarpShape = cutlass::gemm::GemmShape<16, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1514,9 +1514,9 @@ TEST(SM50_device_minimum_plus_ssrgemm_tn_t, 64x64x8_16x32x1_4x4_4x8_4x2) { using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1550,9 +1550,9 @@ TEST(SM50_device_minimum_plus_ssrgemm_tn_t, 128x32x8_32x16x1_4x4_8x4_4x2) { using WarpShape = cutlass::gemm::GemmShape<32, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using 
Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1586,9 +1586,9 @@ TEST(SM50_device_minimum_plus_ssrgemm_tn_t, 128x64x8_32x32x1_8x4_4x8_4x2) { using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1622,9 +1622,9 @@ TEST(SM50_device_minimum_plus_ssrgemm_tn_t, 128x128x8_32x64x1_8x8_4x8_4x2) { using WarpShape = cutlass::gemm::GemmShape<32, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1658,9 +1658,9 @@ TEST(SM50_device_minimum_plus_ssrgemm_tn_t, 256x32x8_64x16x1_8x4_8x4_4x2) { using WarpShape = cutlass::gemm::GemmShape<64, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, 
precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1694,9 +1694,9 @@ TEST(SM50_device_minimum_plus_ssrgemm_tn_t, 256x64x8_64x32x1_8x8_8x4_4x2) { using WarpShape = cutlass::gemm::GemmShape<64, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1730,9 +1730,9 @@ TEST(SM50_device_minimum_plus_ssrgemm_tn_t, 32x64x16_8x16x1_2x2_4x8_4x4) { using WarpShape = cutlass::gemm::GemmShape<8, 16, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1766,9 +1766,9 @@ TEST(SM50_device_minimum_plus_ssrgemm_tn_t, 32x128x16_8x32x1_2x4_4x8_4x4) { using WarpShape = cutlass::gemm::GemmShape<8, 32, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; 
using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1802,9 +1802,9 @@ TEST(SM50_device_minimum_plus_ssrgemm_tn_t, 64x32x16_16x8x1_2x2_8x4_4x4) { using WarpShape = cutlass::gemm::GemmShape<16, 8, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1838,9 +1838,9 @@ TEST(SM50_device_minimum_plus_ssrgemm_tn_t, 64x64x8_16x16x1_4x2_4x8_4x4) { using WarpShape = cutlass::gemm::GemmShape<16, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1874,9 +1874,9 @@ TEST(SM50_device_minimum_plus_ssrgemm_tn_t, 64x128x8_16x32x1_4x4_4x8_4x4) { using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1910,9 
+1910,9 @@ TEST(SM50_device_minimum_plus_ssrgemm_tn_t, 64x256x8_16x64x1_4x8_4x8_4x4) { using WarpShape = cutlass::gemm::GemmShape<16, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1946,9 +1946,9 @@ TEST(SM50_device_minimum_plus_ssrgemm_tn_t, 128x32x16_32x8x1_4x2_8x4_4x4) { using WarpShape = cutlass::gemm::GemmShape<32, 8, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1982,9 +1982,9 @@ TEST(SM50_device_minimum_plus_ssrgemm_tn_t, 128x64x8_32x16x1_4x4_8x4_4x4) { using WarpShape = cutlass::gemm::GemmShape<32, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -2018,9 +2018,9 @@ TEST(SM50_device_minimum_plus_ssrgemm_tn_t, 128x128x8_32x32x1_8x4_4x8_4x4) 
{ using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -2054,9 +2054,9 @@ TEST(SM50_device_minimum_plus_ssrgemm_tn_t, 256x64x8_64x16x1_8x4_8x4_4x4) { using WarpShape = cutlass::gemm::GemmShape<64, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; diff --git a/test/device/sm50_simt_minimum_plus_ssrgemm_tt_n.cu b/test/device/sm50_simt_minimum_plus_ssrgemm_tt_n.cu index 0a6a561..d5af228 100644 --- a/test/device/sm50_simt_minimum_plus_ssrgemm_tt_n.cu +++ b/test/device/sm50_simt_minimum_plus_ssrgemm_tt_n.cu @@ -38,9 +38,9 @@ TEST(SM50_device_minimum_plus_ssrgemm_tt_n, 8x32x8_8x32x1_2x4_4x8_1x1) { using WarpShape = cutlass::gemm::GemmShape<8, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; 
using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -74,9 +74,9 @@ TEST(SM50_device_minimum_plus_ssrgemm_tt_n, 16x32x8_16x32x1_4x4_4x8_1x1) { using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -110,9 +110,9 @@ TEST(SM50_device_minimum_plus_ssrgemm_tt_n, 16x64x8_16x64x1_4x8_4x8_1x1) { using WarpShape = cutlass::gemm::GemmShape<16, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -146,9 +146,9 @@ TEST(SM50_device_minimum_plus_ssrgemm_tt_n, 32x32x8_32x32x1_8x4_4x8_1x1) { using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -182,9 +182,9 @@ 
TEST(SM50_device_minimum_plus_ssrgemm_tt_n, 32x64x8_32x64x1_8x8_4x8_1x1) { using WarpShape = cutlass::gemm::GemmShape<32, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -218,9 +218,9 @@ TEST(SM50_device_minimum_plus_ssrgemm_tt_n, 64x32x8_64x32x1_8x8_8x4_1x1) { using WarpShape = cutlass::gemm::GemmShape<64, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -254,9 +254,9 @@ TEST(SM50_device_minimum_plus_ssrgemm_tt_n, 8x32x8_8x16x1_2x2_4x8_1x2) { using WarpShape = cutlass::gemm::GemmShape<8, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -290,9 +290,9 @@ TEST(SM50_device_minimum_plus_ssrgemm_tt_n, 8x64x8_8x32x1_2x4_4x8_1x2) { using WarpShape = 
cutlass::gemm::GemmShape<8, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -326,9 +326,9 @@ TEST(SM50_device_minimum_plus_ssrgemm_tt_n, 16x32x8_16x16x1_4x2_4x8_1x2) { using WarpShape = cutlass::gemm::GemmShape<16, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -362,9 +362,9 @@ TEST(SM50_device_minimum_plus_ssrgemm_tt_n, 16x64x8_16x32x1_4x4_4x8_1x2) { using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -398,9 +398,9 @@ TEST(SM50_device_minimum_plus_ssrgemm_tt_n, 16x128x8_16x64x1_4x8_4x8_1x2) { using WarpShape = cutlass::gemm::GemmShape<16, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 
1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -434,9 +434,9 @@ TEST(SM50_device_minimum_plus_ssrgemm_tt_n, 32x32x8_32x16x1_4x4_8x4_1x2) { using WarpShape = cutlass::gemm::GemmShape<32, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -470,9 +470,9 @@ TEST(SM50_device_minimum_plus_ssrgemm_tt_n, 32x64x8_32x32x1_8x4_4x8_1x2) { using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -506,9 +506,9 @@ TEST(SM50_device_minimum_plus_ssrgemm_tt_n, 32x128x8_32x64x1_8x8_4x8_1x2) { using WarpShape = cutlass::gemm::GemmShape<32, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - 
precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -542,9 +542,9 @@ TEST(SM50_device_minimum_plus_ssrgemm_tt_n, 64x64x8_64x32x1_8x8_8x4_1x2) { using WarpShape = cutlass::gemm::GemmShape<64, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -578,9 +578,9 @@ TEST(SM50_device_minimum_plus_ssrgemm_tt_n, 32x32x8_16x32x1_4x4_4x8_2x1) { using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -614,9 +614,9 @@ TEST(SM50_device_minimum_plus_ssrgemm_tt_n, 64x32x8_32x32x1_8x4_4x8_2x1) { using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, 
SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -650,9 +650,9 @@ TEST(SM50_device_minimum_plus_ssrgemm_tt_n, 64x64x8_32x64x1_8x8_4x8_2x1) { using WarpShape = cutlass::gemm::GemmShape<32, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -686,9 +686,9 @@ TEST(SM50_device_minimum_plus_ssrgemm_tt_n, 128x32x8_64x32x1_8x8_8x4_2x1) { using WarpShape = cutlass::gemm::GemmShape<64, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -722,9 +722,9 @@ TEST(SM50_device_minimum_plus_ssrgemm_tt_n, 16x32x8_8x16x1_2x2_4x8_2x2) { using WarpShape = cutlass::gemm::GemmShape<8, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + 
precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -758,9 +758,9 @@ TEST(SM50_device_minimum_plus_ssrgemm_tt_n, 16x64x8_8x32x1_2x4_4x8_2x2) { using WarpShape = cutlass::gemm::GemmShape<8, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -794,9 +794,9 @@ TEST(SM50_device_minimum_plus_ssrgemm_tt_n, 32x32x8_16x16x1_4x2_4x8_2x2) { using WarpShape = cutlass::gemm::GemmShape<16, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -830,9 +830,9 @@ TEST(SM50_device_minimum_plus_ssrgemm_tt_n, 32x64x8_16x32x1_4x4_4x8_2x2) { using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; 
using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -866,9 +866,9 @@ TEST(SM50_device_minimum_plus_ssrgemm_tt_n, 32x128x8_16x64x1_4x8_4x8_2x2) { using WarpShape = cutlass::gemm::GemmShape<16, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -902,9 +902,9 @@ TEST(SM50_device_minimum_plus_ssrgemm_tt_n, 64x32x8_32x16x1_4x4_8x4_2x2) { using WarpShape = cutlass::gemm::GemmShape<32, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -938,9 +938,9 @@ TEST(SM50_device_minimum_plus_ssrgemm_tt_n, 64x64x8_32x32x1_8x4_4x8_2x2) { using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -974,9 +974,9 
@@ TEST(SM50_device_minimum_plus_ssrgemm_tt_n, 64x128x8_32x64x1_8x8_4x8_2x2) { using WarpShape = cutlass::gemm::GemmShape<32, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1010,9 +1010,9 @@ TEST(SM50_device_minimum_plus_ssrgemm_tt_n, 128x32x8_64x16x1_8x4_8x4_2x2) { using WarpShape = cutlass::gemm::GemmShape<64, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1046,9 +1046,9 @@ TEST(SM50_device_minimum_plus_ssrgemm_tt_n, 128x64x8_64x32x1_8x8_8x4_2x2) { using WarpShape = cutlass::gemm::GemmShape<64, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1082,9 +1082,9 @@ TEST(SM50_device_minimum_plus_ssrgemm_tt_n, 16x64x16_8x16x1_2x2_4x8_2x4) { using 
WarpShape = cutlass::gemm::GemmShape<8, 16, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1118,9 +1118,9 @@ TEST(SM50_device_minimum_plus_ssrgemm_tt_n, 16x128x16_8x32x1_2x4_4x8_2x4) { using WarpShape = cutlass::gemm::GemmShape<8, 32, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1154,9 +1154,9 @@ TEST(SM50_device_minimum_plus_ssrgemm_tt_n, 32x32x8_16x8x1_2x2_8x4_2x4) { using WarpShape = cutlass::gemm::GemmShape<16, 8, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1190,9 +1190,9 @@ TEST(SM50_device_minimum_plus_ssrgemm_tt_n, 32x64x8_16x16x1_4x2_4x8_2x4) { using WarpShape = cutlass::gemm::GemmShape<16, 16, 8>; using InstructionShape = 
cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1226,9 +1226,9 @@ TEST(SM50_device_minimum_plus_ssrgemm_tt_n, 32x128x8_16x32x1_4x4_4x8_2x4) { using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1262,9 +1262,9 @@ TEST(SM50_device_minimum_plus_ssrgemm_tt_n, 32x256x8_16x64x1_4x8_4x8_2x4) { using WarpShape = cutlass::gemm::GemmShape<16, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1298,9 +1298,9 @@ TEST(SM50_device_minimum_plus_ssrgemm_tt_n, 64x64x8_32x16x1_4x4_8x4_2x4) { using WarpShape = cutlass::gemm::GemmShape<32, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename 
cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1334,9 +1334,9 @@ TEST(SM50_device_minimum_plus_ssrgemm_tt_n, 64x128x8_32x32x1_8x4_4x8_2x4) { using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1370,9 +1370,9 @@ TEST(SM50_device_minimum_plus_ssrgemm_tt_n, 64x256x8_32x64x1_8x8_4x8_2x4) { using WarpShape = cutlass::gemm::GemmShape<32, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1406,9 +1406,9 @@ TEST(SM50_device_minimum_plus_ssrgemm_tt_n, 128x128x8_64x32x1_8x8_8x4_2x4) { using WarpShape = cutlass::gemm::GemmShape<64, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, 
precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1442,9 +1442,9 @@ TEST(SM50_device_minimum_plus_ssrgemm_tt_n, 32x32x8_8x16x1_2x2_4x8_4x2) { using WarpShape = cutlass::gemm::GemmShape<8, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1478,9 +1478,9 @@ TEST(SM50_device_minimum_plus_ssrgemm_tt_n, 64x32x8_16x16x1_4x2_4x8_4x2) { using WarpShape = cutlass::gemm::GemmShape<16, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1514,9 +1514,9 @@ TEST(SM50_device_minimum_plus_ssrgemm_tt_n, 64x64x8_16x32x1_4x4_4x8_4x2) { using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = 
typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1550,9 +1550,9 @@ TEST(SM50_device_minimum_plus_ssrgemm_tt_n, 128x32x8_32x16x1_4x4_8x4_4x2) { using WarpShape = cutlass::gemm::GemmShape<32, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1586,9 +1586,9 @@ TEST(SM50_device_minimum_plus_ssrgemm_tt_n, 128x64x8_32x32x1_8x4_4x8_4x2) { using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1622,9 +1622,9 @@ TEST(SM50_device_minimum_plus_ssrgemm_tt_n, 128x128x8_32x64x1_8x8_4x8_4x2) { using WarpShape = cutlass::gemm::GemmShape<32, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, 
precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1658,9 +1658,9 @@ TEST(SM50_device_minimum_plus_ssrgemm_tt_n, 256x32x8_64x16x1_8x4_8x4_4x2) { using WarpShape = cutlass::gemm::GemmShape<64, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1694,9 +1694,9 @@ TEST(SM50_device_minimum_plus_ssrgemm_tt_n, 256x64x8_64x32x1_8x8_8x4_4x2) { using WarpShape = cutlass::gemm::GemmShape<64, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1730,9 +1730,9 @@ TEST(SM50_device_minimum_plus_ssrgemm_tt_n, 32x64x16_8x16x1_2x2_4x8_4x4) { using WarpShape = cutlass::gemm::GemmShape<8, 16, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = 
Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1766,9 +1766,9 @@ TEST(SM50_device_minimum_plus_ssrgemm_tt_n, 32x128x16_8x32x1_2x4_4x8_4x4) { using WarpShape = cutlass::gemm::GemmShape<8, 32, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1802,9 +1802,9 @@ TEST(SM50_device_minimum_plus_ssrgemm_tt_n, 64x32x16_16x8x1_2x2_8x4_4x4) { using WarpShape = cutlass::gemm::GemmShape<16, 8, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1838,9 +1838,9 @@ TEST(SM50_device_minimum_plus_ssrgemm_tt_n, 64x64x8_16x16x1_4x2_4x8_4x4) { using WarpShape = cutlass::gemm::GemmShape<16, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1874,9 +1874,9 @@ 
TEST(SM50_device_minimum_plus_ssrgemm_tt_n, 64x128x8_16x32x1_4x4_4x8_4x4) { using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1910,9 +1910,9 @@ TEST(SM50_device_minimum_plus_ssrgemm_tt_n, 64x256x8_16x64x1_4x8_4x8_4x4) { using WarpShape = cutlass::gemm::GemmShape<16, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1946,9 +1946,9 @@ TEST(SM50_device_minimum_plus_ssrgemm_tt_n, 128x32x16_32x8x1_4x2_8x4_4x4) { using WarpShape = cutlass::gemm::GemmShape<32, 8, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1982,9 +1982,9 @@ TEST(SM50_device_minimum_plus_ssrgemm_tt_n, 128x64x8_32x16x1_4x4_8x4_4x4) { using 
WarpShape = cutlass::gemm::GemmShape<32, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -2018,9 +2018,9 @@ TEST(SM50_device_minimum_plus_ssrgemm_tt_n, 128x128x8_32x32x1_8x4_4x8_4x4) { using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -2054,9 +2054,9 @@ TEST(SM50_device_minimum_plus_ssrgemm_tt_n, 256x64x8_64x16x1_8x4_8x4_4x4) { using WarpShape = cutlass::gemm::GemmShape<64, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; diff --git a/test/device/sm50_simt_minimum_plus_ssrgemm_tt_t.cu b/test/device/sm50_simt_minimum_plus_ssrgemm_tt_t.cu index 717dea4..822c20c 100644 --- 
a/test/device/sm50_simt_minimum_plus_ssrgemm_tt_t.cu +++ b/test/device/sm50_simt_minimum_plus_ssrgemm_tt_t.cu @@ -38,9 +38,9 @@ TEST(SM50_device_minimum_plus_ssrgemm_tt_t, 8x32x8_8x32x1_2x4_4x8_1x1) { using WarpShape = cutlass::gemm::GemmShape<8, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -74,9 +74,9 @@ TEST(SM50_device_minimum_plus_ssrgemm_tt_t, 16x32x8_16x32x1_4x4_4x8_1x1) { using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -110,9 +110,9 @@ TEST(SM50_device_minimum_plus_ssrgemm_tt_t, 16x64x8_16x64x1_4x8_4x8_1x1) { using WarpShape = cutlass::gemm::GemmShape<16, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = 
Config::MultiplicationOp; @@ -146,9 +146,9 @@ TEST(SM50_device_minimum_plus_ssrgemm_tt_t, 32x32x8_32x32x1_8x4_4x8_1x1) { using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -182,9 +182,9 @@ TEST(SM50_device_minimum_plus_ssrgemm_tt_t, 32x64x8_32x64x1_8x8_4x8_1x1) { using WarpShape = cutlass::gemm::GemmShape<32, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -218,9 +218,9 @@ TEST(SM50_device_minimum_plus_ssrgemm_tt_t, 64x32x8_64x32x1_8x8_8x4_1x1) { using WarpShape = cutlass::gemm::GemmShape<64, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -254,9 +254,9 @@ TEST(SM50_device_minimum_plus_ssrgemm_tt_t, 
8x32x8_8x16x1_2x2_4x8_1x2) { using WarpShape = cutlass::gemm::GemmShape<8, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -290,9 +290,9 @@ TEST(SM50_device_minimum_plus_ssrgemm_tt_t, 8x64x8_8x32x1_2x4_4x8_1x2) { using WarpShape = cutlass::gemm::GemmShape<8, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -326,9 +326,9 @@ TEST(SM50_device_minimum_plus_ssrgemm_tt_t, 16x32x8_16x16x1_4x2_4x8_1x2) { using WarpShape = cutlass::gemm::GemmShape<16, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -362,9 +362,9 @@ TEST(SM50_device_minimum_plus_ssrgemm_tt_t, 16x64x8_16x32x1_4x4_4x8_1x2) { using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using 
InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -398,9 +398,9 @@ TEST(SM50_device_minimum_plus_ssrgemm_tt_t, 16x128x8_16x64x1_4x8_4x8_1x2) { using WarpShape = cutlass::gemm::GemmShape<16, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -434,9 +434,9 @@ TEST(SM50_device_minimum_plus_ssrgemm_tt_t, 32x32x8_32x16x1_4x4_8x4_1x2) { using WarpShape = cutlass::gemm::GemmShape<32, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -470,9 +470,9 @@ TEST(SM50_device_minimum_plus_ssrgemm_tt_t, 32x64x8_32x32x1_8x4_4x8_1x2) { using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename 
cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -506,9 +506,9 @@ TEST(SM50_device_minimum_plus_ssrgemm_tt_t, 32x128x8_32x64x1_8x8_4x8_1x2) { using WarpShape = cutlass::gemm::GemmShape<32, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -542,9 +542,9 @@ TEST(SM50_device_minimum_plus_ssrgemm_tt_t, 64x64x8_64x32x1_8x8_8x4_1x2) { using WarpShape = cutlass::gemm::GemmShape<64, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -578,9 +578,9 @@ TEST(SM50_device_minimum_plus_ssrgemm_tt_t, 32x32x8_16x32x1_4x4_4x8_2x1) { using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, 
precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -614,9 +614,9 @@ TEST(SM50_device_minimum_plus_ssrgemm_tt_t, 64x32x8_32x32x1_8x4_4x8_2x1) { using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -650,9 +650,9 @@ TEST(SM50_device_minimum_plus_ssrgemm_tt_t, 64x64x8_32x64x1_8x8_4x8_2x1) { using WarpShape = cutlass::gemm::GemmShape<32, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -686,9 +686,9 @@ TEST(SM50_device_minimum_plus_ssrgemm_tt_t, 128x32x8_64x32x1_8x8_8x4_2x1) { using WarpShape = cutlass::gemm::GemmShape<64, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename 
cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -722,9 +722,9 @@ TEST(SM50_device_minimum_plus_ssrgemm_tt_t, 16x32x8_8x16x1_2x2_4x8_2x2) { using WarpShape = cutlass::gemm::GemmShape<8, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -758,9 +758,9 @@ TEST(SM50_device_minimum_plus_ssrgemm_tt_t, 16x64x8_8x32x1_2x4_4x8_2x2) { using WarpShape = cutlass::gemm::GemmShape<8, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -794,9 +794,9 @@ TEST(SM50_device_minimum_plus_ssrgemm_tt_t, 32x32x8_16x16x1_4x2_4x8_2x2) { using WarpShape = cutlass::gemm::GemmShape<16, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + 
cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -830,9 +830,9 @@ TEST(SM50_device_minimum_plus_ssrgemm_tt_t, 32x64x8_16x32x1_4x4_4x8_2x2) { using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -866,9 +866,9 @@ TEST(SM50_device_minimum_plus_ssrgemm_tt_t, 32x128x8_16x64x1_4x8_4x8_2x2) { using WarpShape = cutlass::gemm::GemmShape<16, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -902,9 +902,9 @@ TEST(SM50_device_minimum_plus_ssrgemm_tt_t, 64x32x8_32x16x1_4x4_8x4_2x2) { using WarpShape = cutlass::gemm::GemmShape<32, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp 
= Config::MultiplicationOp; @@ -938,9 +938,9 @@ TEST(SM50_device_minimum_plus_ssrgemm_tt_t, 64x64x8_32x32x1_8x4_4x8_2x2) { using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -974,9 +974,9 @@ TEST(SM50_device_minimum_plus_ssrgemm_tt_t, 64x128x8_32x64x1_8x8_4x8_2x2) { using WarpShape = cutlass::gemm::GemmShape<32, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1010,9 +1010,9 @@ TEST(SM50_device_minimum_plus_ssrgemm_tt_t, 128x32x8_64x16x1_8x4_8x4_2x2) { using WarpShape = cutlass::gemm::GemmShape<64, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1046,9 +1046,9 @@ 
TEST(SM50_device_minimum_plus_ssrgemm_tt_t, 128x64x8_64x32x1_8x8_8x4_2x2) { using WarpShape = cutlass::gemm::GemmShape<64, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1082,9 +1082,9 @@ TEST(SM50_device_minimum_plus_ssrgemm_tt_t, 16x64x16_8x16x1_2x2_4x8_2x4) { using WarpShape = cutlass::gemm::GemmShape<8, 16, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1118,9 +1118,9 @@ TEST(SM50_device_minimum_plus_ssrgemm_tt_t, 16x128x16_8x32x1_2x4_4x8_2x4) { using WarpShape = cutlass::gemm::GemmShape<8, 32, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1154,9 +1154,9 @@ TEST(SM50_device_minimum_plus_ssrgemm_tt_t, 32x32x8_16x8x1_2x2_8x4_2x4) { using 
WarpShape = cutlass::gemm::GemmShape<16, 8, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1190,9 +1190,9 @@ TEST(SM50_device_minimum_plus_ssrgemm_tt_t, 32x64x8_16x16x1_4x2_4x8_2x4) { using WarpShape = cutlass::gemm::GemmShape<16, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1226,9 +1226,9 @@ TEST(SM50_device_minimum_plus_ssrgemm_tt_t, 32x128x8_16x32x1_4x4_4x8_2x4) { using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1262,9 +1262,9 @@ TEST(SM50_device_minimum_plus_ssrgemm_tt_t, 32x256x8_16x64x1_4x8_4x8_2x4) { using WarpShape = cutlass::gemm::GemmShape<16, 64, 8>; using InstructionShape = 
cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1298,9 +1298,9 @@ TEST(SM50_device_minimum_plus_ssrgemm_tt_t, 64x64x8_32x16x1_4x4_8x4_2x4) { using WarpShape = cutlass::gemm::GemmShape<32, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1334,9 +1334,9 @@ TEST(SM50_device_minimum_plus_ssrgemm_tt_t, 64x128x8_32x32x1_8x4_4x8_2x4) { using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1370,9 +1370,9 @@ TEST(SM50_device_minimum_plus_ssrgemm_tt_t, 64x256x8_32x64x1_8x8_4x8_2x4) { using WarpShape = cutlass::gemm::GemmShape<32, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename 
cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1406,9 +1406,9 @@ TEST(SM50_device_minimum_plus_ssrgemm_tt_t, 128x128x8_64x32x1_8x8_8x4_2x4) { using WarpShape = cutlass::gemm::GemmShape<64, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1442,9 +1442,9 @@ TEST(SM50_device_minimum_plus_ssrgemm_tt_t, 32x32x8_8x16x1_2x2_4x8_4x2) { using WarpShape = cutlass::gemm::GemmShape<8, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1478,9 +1478,9 @@ TEST(SM50_device_minimum_plus_ssrgemm_tt_t, 64x32x8_16x16x1_4x2_4x8_4x2) { using WarpShape = cutlass::gemm::GemmShape<16, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, 
precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1514,9 +1514,9 @@ TEST(SM50_device_minimum_plus_ssrgemm_tt_t, 64x64x8_16x32x1_4x4_4x8_4x2) { using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1550,9 +1550,9 @@ TEST(SM50_device_minimum_plus_ssrgemm_tt_t, 128x32x8_32x16x1_4x4_8x4_4x2) { using WarpShape = cutlass::gemm::GemmShape<32, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1586,9 +1586,9 @@ TEST(SM50_device_minimum_plus_ssrgemm_tt_t, 128x64x8_32x32x1_8x4_4x8_4x2) { using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = 
typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1622,9 +1622,9 @@ TEST(SM50_device_minimum_plus_ssrgemm_tt_t, 128x128x8_32x64x1_8x8_4x8_4x2) { using WarpShape = cutlass::gemm::GemmShape<32, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1658,9 +1658,9 @@ TEST(SM50_device_minimum_plus_ssrgemm_tt_t, 256x32x8_64x16x1_8x4_8x4_4x2) { using WarpShape = cutlass::gemm::GemmShape<64, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1694,9 +1694,9 @@ TEST(SM50_device_minimum_plus_ssrgemm_tt_t, 256x64x8_64x32x1_8x8_8x4_4x2) { using WarpShape = cutlass::gemm::GemmShape<64, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, 
precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1730,9 +1730,9 @@ TEST(SM50_device_minimum_plus_ssrgemm_tt_t, 32x64x16_8x16x1_2x2_4x8_4x4) { using WarpShape = cutlass::gemm::GemmShape<8, 16, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1766,9 +1766,9 @@ TEST(SM50_device_minimum_plus_ssrgemm_tt_t, 32x128x16_8x32x1_2x4_4x8_4x4) { using WarpShape = cutlass::gemm::GemmShape<8, 32, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1802,9 +1802,9 @@ TEST(SM50_device_minimum_plus_ssrgemm_tt_t, 64x32x16_16x8x1_2x2_8x4_4x4) { using WarpShape = cutlass::gemm::GemmShape<16, 8, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = 
Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1838,9 +1838,9 @@ TEST(SM50_device_minimum_plus_ssrgemm_tt_t, 64x64x8_16x16x1_4x2_4x8_4x4) { using WarpShape = cutlass::gemm::GemmShape<16, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1874,9 +1874,9 @@ TEST(SM50_device_minimum_plus_ssrgemm_tt_t, 64x128x8_16x32x1_4x4_4x8_4x4) { using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1910,9 +1910,9 @@ TEST(SM50_device_minimum_plus_ssrgemm_tt_t, 64x256x8_16x64x1_4x8_4x8_4x4) { using WarpShape = cutlass::gemm::GemmShape<16, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1946,9 +1946,9 @@ 
TEST(SM50_device_minimum_plus_ssrgemm_tt_t, 128x32x16_32x8x1_4x2_8x4_4x4) { using WarpShape = cutlass::gemm::GemmShape<32, 8, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1982,9 +1982,9 @@ TEST(SM50_device_minimum_plus_ssrgemm_tt_t, 128x64x8_32x16x1_4x4_8x4_4x4) { using WarpShape = cutlass::gemm::GemmShape<32, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -2018,9 +2018,9 @@ TEST(SM50_device_minimum_plus_ssrgemm_tt_t, 128x128x8_32x32x1_8x4_4x8_4x4) { using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -2054,9 +2054,9 @@ TEST(SM50_device_minimum_plus_ssrgemm_tt_t, 256x64x8_64x16x1_8x4_8x4_4x4) { using 
WarpShape = cutlass::gemm::GemmShape<64, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::minimum, cuasr::plus, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::minimum, cuasr::plus, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; diff --git a/test/device/sm50_simt_plus_multiplies_dsrgemm_nn_n.cu b/test/device/sm50_simt_plus_multiplies_dsrgemm_nn_n.cu index 97d031f..3a197de 100644 --- a/test/device/sm50_simt_plus_multiplies_dsrgemm_nn_n.cu +++ b/test/device/sm50_simt_plus_multiplies_dsrgemm_nn_n.cu @@ -38,9 +38,9 @@ TEST(SM50_device_plus_multiplies_dsrgemm_nn_n, 8x32x8_8x32x1_2x4_4x8_1x1) { using WarpShape = cutlass::gemm::GemmShape<8, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -74,9 +74,9 @@ TEST(SM50_device_plus_multiplies_dsrgemm_nn_n, 16x32x8_16x32x1_4x4_4x8_1x1) { using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, 
OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -110,9 +110,9 @@ TEST(SM50_device_plus_multiplies_dsrgemm_nn_n, 16x64x8_16x64x1_4x8_4x8_1x1) { using WarpShape = cutlass::gemm::GemmShape<16, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -146,9 +146,9 @@ TEST(SM50_device_plus_multiplies_dsrgemm_nn_n, 32x32x8_32x32x1_8x4_4x8_1x1) { using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -182,9 +182,9 @@ TEST(SM50_device_plus_multiplies_dsrgemm_nn_n, 8x32x8_8x16x1_2x2_4x8_1x2) { using WarpShape = cutlass::gemm::GemmShape<8, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = 
Config::MultiplicationOp; @@ -218,9 +218,9 @@ TEST(SM50_device_plus_multiplies_dsrgemm_nn_n, 8x64x8_8x32x1_2x4_4x8_1x2) { using WarpShape = cutlass::gemm::GemmShape<8, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -254,9 +254,9 @@ TEST(SM50_device_plus_multiplies_dsrgemm_nn_n, 16x32x8_16x16x1_4x2_4x8_1x2) { using WarpShape = cutlass::gemm::GemmShape<16, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -290,9 +290,9 @@ TEST(SM50_device_plus_multiplies_dsrgemm_nn_n, 16x64x8_16x32x1_4x4_4x8_1x2) { using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -326,9 +326,9 @@ 
TEST(SM50_device_plus_multiplies_dsrgemm_nn_n, 16x128x8_16x64x1_4x8_4x8_1x2) { using WarpShape = cutlass::gemm::GemmShape<16, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -362,9 +362,9 @@ TEST(SM50_device_plus_multiplies_dsrgemm_nn_n, 32x32x8_32x16x1_4x4_8x4_1x2) { using WarpShape = cutlass::gemm::GemmShape<32, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -398,9 +398,9 @@ TEST(SM50_device_plus_multiplies_dsrgemm_nn_n, 32x64x8_32x32x1_8x4_4x8_1x2) { using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -434,9 +434,9 @@ TEST(SM50_device_plus_multiplies_dsrgemm_nn_n, 
32x32x8_16x32x1_4x4_4x8_2x1) { using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -470,9 +470,9 @@ TEST(SM50_device_plus_multiplies_dsrgemm_nn_n, 64x32x8_32x32x1_8x4_4x8_2x1) { using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -506,9 +506,9 @@ TEST(SM50_device_plus_multiplies_dsrgemm_nn_n, 16x32x8_8x16x1_2x2_4x8_2x2) { using WarpShape = cutlass::gemm::GemmShape<8, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -542,9 +542,9 @@ TEST(SM50_device_plus_multiplies_dsrgemm_nn_n, 16x64x8_8x32x1_2x4_4x8_2x2) { using WarpShape = 
cutlass::gemm::GemmShape<8, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -578,9 +578,9 @@ TEST(SM50_device_plus_multiplies_dsrgemm_nn_n, 32x32x8_16x16x1_4x2_4x8_2x2) { using WarpShape = cutlass::gemm::GemmShape<16, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -614,9 +614,9 @@ TEST(SM50_device_plus_multiplies_dsrgemm_nn_n, 32x64x8_16x32x1_4x4_4x8_2x2) { using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -650,9 +650,9 @@ TEST(SM50_device_plus_multiplies_dsrgemm_nn_n, 32x128x8_16x64x1_4x8_4x8_2x2) { using WarpShape = cutlass::gemm::GemmShape<16, 64, 8>; using InstructionShape = 
cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -686,9 +686,9 @@ TEST(SM50_device_plus_multiplies_dsrgemm_nn_n, 64x32x8_32x16x1_4x4_8x4_2x2) { using WarpShape = cutlass::gemm::GemmShape<32, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -722,9 +722,9 @@ TEST(SM50_device_plus_multiplies_dsrgemm_nn_n, 64x64x8_32x32x1_8x4_4x8_2x2) { using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -758,9 +758,9 @@ TEST(SM50_device_plus_multiplies_dsrgemm_nn_n, 128x32x8_64x16x1_8x4_8x4_2x2) { using WarpShape = cutlass::gemm::GemmShape<64, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename 
cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -794,9 +794,9 @@ TEST(SM50_device_plus_multiplies_dsrgemm_nn_n, 16x64x16_8x16x1_2x2_4x8_2x4) { using WarpShape = cutlass::gemm::GemmShape<8, 16, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -830,9 +830,9 @@ TEST(SM50_device_plus_multiplies_dsrgemm_nn_n, 16x128x16_8x32x1_2x4_4x8_2x4) { using WarpShape = cutlass::gemm::GemmShape<8, 32, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -866,9 +866,9 @@ TEST(SM50_device_plus_multiplies_dsrgemm_nn_n, 32x32x8_16x8x1_2x2_8x4_2x4) { using WarpShape = cutlass::gemm::GemmShape<16, 8, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, 
precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -902,9 +902,9 @@ TEST(SM50_device_plus_multiplies_dsrgemm_nn_n, 32x64x8_16x16x1_4x2_4x8_2x4) { using WarpShape = cutlass::gemm::GemmShape<16, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -938,9 +938,9 @@ TEST(SM50_device_plus_multiplies_dsrgemm_nn_n, 32x128x8_16x32x1_4x4_4x8_2x4) { using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -974,9 +974,9 @@ TEST(SM50_device_plus_multiplies_dsrgemm_nn_n, 64x64x8_32x16x1_4x4_8x4_2x4) { using WarpShape = cutlass::gemm::GemmShape<32, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, 
cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1010,9 +1010,9 @@ TEST(SM50_device_plus_multiplies_dsrgemm_nn_n, 32x32x8_8x16x1_2x2_4x8_4x2) { using WarpShape = cutlass::gemm::GemmShape<8, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1046,9 +1046,9 @@ TEST(SM50_device_plus_multiplies_dsrgemm_nn_n, 64x32x8_16x16x1_4x2_4x8_4x2) { using WarpShape = cutlass::gemm::GemmShape<16, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1082,9 +1082,9 @@ TEST(SM50_device_plus_multiplies_dsrgemm_nn_n, 64x64x8_16x32x1_4x4_4x8_4x2) { using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename 
cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1118,9 +1118,9 @@ TEST(SM50_device_plus_multiplies_dsrgemm_nn_n, 128x32x8_32x16x1_4x4_8x4_4x2) { using WarpShape = cutlass::gemm::GemmShape<32, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1154,9 +1154,9 @@ TEST(SM50_device_plus_multiplies_dsrgemm_nn_n, 32x64x16_8x16x1_2x2_4x8_4x4) { using WarpShape = cutlass::gemm::GemmShape<8, 16, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1190,9 +1190,9 @@ TEST(SM50_device_plus_multiplies_dsrgemm_nn_n, 32x128x16_8x32x1_2x4_4x8_4x4) { using WarpShape = cutlass::gemm::GemmShape<8, 32, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + 
precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1226,9 +1226,9 @@ TEST(SM50_device_plus_multiplies_dsrgemm_nn_n, 64x32x16_16x8x1_2x2_8x4_4x4) { using WarpShape = cutlass::gemm::GemmShape<16, 8, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1262,9 +1262,9 @@ TEST(SM50_device_plus_multiplies_dsrgemm_nn_n, 64x64x8_16x16x1_4x2_4x8_4x4) { using WarpShape = cutlass::gemm::GemmShape<16, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1298,9 +1298,9 @@ TEST(SM50_device_plus_multiplies_dsrgemm_nn_n, 128x32x16_32x8x1_4x2_8x4_4x4) { using WarpShape = cutlass::gemm::GemmShape<32, 8, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, 
cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; diff --git a/test/device/sm50_simt_plus_multiplies_dsrgemm_nn_t.cu b/test/device/sm50_simt_plus_multiplies_dsrgemm_nn_t.cu index 4c238e5..79a50c5 100644 --- a/test/device/sm50_simt_plus_multiplies_dsrgemm_nn_t.cu +++ b/test/device/sm50_simt_plus_multiplies_dsrgemm_nn_t.cu @@ -38,9 +38,9 @@ TEST(SM50_device_plus_multiplies_dsrgemm_nn_t, 8x32x8_8x32x1_2x4_4x8_1x1) { using WarpShape = cutlass::gemm::GemmShape<8, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -74,9 +74,9 @@ TEST(SM50_device_plus_multiplies_dsrgemm_nn_t, 16x32x8_16x32x1_4x4_4x8_1x1) { using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -110,9 +110,9 @@ TEST(SM50_device_plus_multiplies_dsrgemm_nn_t, 16x64x8_16x64x1_4x8_4x8_1x1) { using WarpShape = cutlass::gemm::GemmShape<16, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, 
precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -146,9 +146,9 @@ TEST(SM50_device_plus_multiplies_dsrgemm_nn_t, 32x32x8_32x32x1_8x4_4x8_1x1) { using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -182,9 +182,9 @@ TEST(SM50_device_plus_multiplies_dsrgemm_nn_t, 8x32x8_8x16x1_2x2_4x8_1x2) { using WarpShape = cutlass::gemm::GemmShape<8, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -218,9 +218,9 @@ TEST(SM50_device_plus_multiplies_dsrgemm_nn_t, 8x64x8_8x32x1_2x4_4x8_1x2) { using WarpShape = cutlass::gemm::GemmShape<8, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using 
Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -254,9 +254,9 @@ TEST(SM50_device_plus_multiplies_dsrgemm_nn_t, 16x32x8_16x16x1_4x2_4x8_1x2) { using WarpShape = cutlass::gemm::GemmShape<16, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -290,9 +290,9 @@ TEST(SM50_device_plus_multiplies_dsrgemm_nn_t, 16x64x8_16x32x1_4x4_4x8_1x2) { using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -326,9 +326,9 @@ TEST(SM50_device_plus_multiplies_dsrgemm_nn_t, 16x128x8_16x64x1_4x8_4x8_1x2) { using WarpShape = cutlass::gemm::GemmShape<16, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename 
cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -362,9 +362,9 @@ TEST(SM50_device_plus_multiplies_dsrgemm_nn_t, 32x32x8_32x16x1_4x4_8x4_1x2) { using WarpShape = cutlass::gemm::GemmShape<32, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -398,9 +398,9 @@ TEST(SM50_device_plus_multiplies_dsrgemm_nn_t, 32x64x8_32x32x1_8x4_4x8_1x2) { using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -434,9 +434,9 @@ TEST(SM50_device_plus_multiplies_dsrgemm_nn_t, 32x32x8_16x32x1_4x4_4x8_2x1) { using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, 
precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -470,9 +470,9 @@ TEST(SM50_device_plus_multiplies_dsrgemm_nn_t, 64x32x8_32x32x1_8x4_4x8_2x1) { using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -506,9 +506,9 @@ TEST(SM50_device_plus_multiplies_dsrgemm_nn_t, 16x32x8_8x16x1_2x2_4x8_2x2) { using WarpShape = cutlass::gemm::GemmShape<8, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -542,9 +542,9 @@ TEST(SM50_device_plus_multiplies_dsrgemm_nn_t, 16x64x8_8x32x1_2x4_4x8_2x2) { using WarpShape = cutlass::gemm::GemmShape<8, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, 
OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -578,9 +578,9 @@ TEST(SM50_device_plus_multiplies_dsrgemm_nn_t, 32x32x8_16x16x1_4x2_4x8_2x2) { using WarpShape = cutlass::gemm::GemmShape<16, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -614,9 +614,9 @@ TEST(SM50_device_plus_multiplies_dsrgemm_nn_t, 32x64x8_16x32x1_4x4_4x8_2x2) { using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -650,9 +650,9 @@ TEST(SM50_device_plus_multiplies_dsrgemm_nn_t, 32x128x8_16x64x1_4x8_4x8_2x2) { using WarpShape = cutlass::gemm::GemmShape<16, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = 
Config::MultiplicationOp; @@ -686,9 +686,9 @@ TEST(SM50_device_plus_multiplies_dsrgemm_nn_t, 64x32x8_32x16x1_4x4_8x4_2x2) { using WarpShape = cutlass::gemm::GemmShape<32, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -722,9 +722,9 @@ TEST(SM50_device_plus_multiplies_dsrgemm_nn_t, 64x64x8_32x32x1_8x4_4x8_2x2) { using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -758,9 +758,9 @@ TEST(SM50_device_plus_multiplies_dsrgemm_nn_t, 128x32x8_64x16x1_8x4_8x4_2x2) { using WarpShape = cutlass::gemm::GemmShape<64, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -794,9 +794,9 @@ 
TEST(SM50_device_plus_multiplies_dsrgemm_nn_t, 16x64x16_8x16x1_2x2_4x8_2x4) { using WarpShape = cutlass::gemm::GemmShape<8, 16, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -830,9 +830,9 @@ TEST(SM50_device_plus_multiplies_dsrgemm_nn_t, 16x128x16_8x32x1_2x4_4x8_2x4) { using WarpShape = cutlass::gemm::GemmShape<8, 32, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -866,9 +866,9 @@ TEST(SM50_device_plus_multiplies_dsrgemm_nn_t, 32x32x8_16x8x1_2x2_8x4_2x4) { using WarpShape = cutlass::gemm::GemmShape<16, 8, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -902,9 +902,9 @@ TEST(SM50_device_plus_multiplies_dsrgemm_nn_t, 
32x64x8_16x16x1_4x2_4x8_2x4) { using WarpShape = cutlass::gemm::GemmShape<16, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -938,9 +938,9 @@ TEST(SM50_device_plus_multiplies_dsrgemm_nn_t, 32x128x8_16x32x1_4x4_4x8_2x4) { using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -974,9 +974,9 @@ TEST(SM50_device_plus_multiplies_dsrgemm_nn_t, 64x64x8_32x16x1_4x4_8x4_2x4) { using WarpShape = cutlass::gemm::GemmShape<32, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1010,9 +1010,9 @@ TEST(SM50_device_plus_multiplies_dsrgemm_nn_t, 32x32x8_8x16x1_2x2_4x8_4x2) { using WarpShape = 
cutlass::gemm::GemmShape<8, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1046,9 +1046,9 @@ TEST(SM50_device_plus_multiplies_dsrgemm_nn_t, 64x32x8_16x16x1_4x2_4x8_4x2) { using WarpShape = cutlass::gemm::GemmShape<16, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1082,9 +1082,9 @@ TEST(SM50_device_plus_multiplies_dsrgemm_nn_t, 64x64x8_16x32x1_4x4_4x8_4x2) { using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1118,9 +1118,9 @@ TEST(SM50_device_plus_multiplies_dsrgemm_nn_t, 128x32x8_32x16x1_4x4_8x4_4x2) { using WarpShape = cutlass::gemm::GemmShape<32, 16, 8>; using InstructionShape = 
cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1154,9 +1154,9 @@ TEST(SM50_device_plus_multiplies_dsrgemm_nn_t, 32x64x16_8x16x1_2x2_4x8_4x4) { using WarpShape = cutlass::gemm::GemmShape<8, 16, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1190,9 +1190,9 @@ TEST(SM50_device_plus_multiplies_dsrgemm_nn_t, 32x128x16_8x32x1_2x4_4x8_4x4) { using WarpShape = cutlass::gemm::GemmShape<8, 32, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1226,9 +1226,9 @@ TEST(SM50_device_plus_multiplies_dsrgemm_nn_t, 64x32x16_16x8x1_2x2_8x4_4x4) { using WarpShape = cutlass::gemm::GemmShape<16, 8, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename 
cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1262,9 +1262,9 @@ TEST(SM50_device_plus_multiplies_dsrgemm_nn_t, 64x64x8_16x16x1_4x2_4x8_4x4) { using WarpShape = cutlass::gemm::GemmShape<16, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1298,9 +1298,9 @@ TEST(SM50_device_plus_multiplies_dsrgemm_nn_t, 128x32x16_32x8x1_4x2_8x4_4x4) { using WarpShape = cutlass::gemm::GemmShape<32, 8, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; diff --git a/test/device/sm50_simt_plus_multiplies_dsrgemm_nt_n.cu b/test/device/sm50_simt_plus_multiplies_dsrgemm_nt_n.cu index e958ee7..f6f29d3 100644 --- a/test/device/sm50_simt_plus_multiplies_dsrgemm_nt_n.cu +++ b/test/device/sm50_simt_plus_multiplies_dsrgemm_nt_n.cu @@ -38,9 +38,9 @@ 
TEST(SM50_device_plus_multiplies_dsrgemm_nt_n, 8x32x8_8x32x1_2x4_4x8_1x1) { using WarpShape = cutlass::gemm::GemmShape<8, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -74,9 +74,9 @@ TEST(SM50_device_plus_multiplies_dsrgemm_nt_n, 16x32x8_16x32x1_4x4_4x8_1x1) { using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -110,9 +110,9 @@ TEST(SM50_device_plus_multiplies_dsrgemm_nt_n, 16x64x8_16x64x1_4x8_4x8_1x1) { using WarpShape = cutlass::gemm::GemmShape<16, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -146,9 +146,9 @@ TEST(SM50_device_plus_multiplies_dsrgemm_nt_n, 
32x32x8_32x32x1_8x4_4x8_1x1) { using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -182,9 +182,9 @@ TEST(SM50_device_plus_multiplies_dsrgemm_nt_n, 8x32x8_8x16x1_2x2_4x8_1x2) { using WarpShape = cutlass::gemm::GemmShape<8, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -218,9 +218,9 @@ TEST(SM50_device_plus_multiplies_dsrgemm_nt_n, 8x64x8_8x32x1_2x4_4x8_1x2) { using WarpShape = cutlass::gemm::GemmShape<8, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -254,9 +254,9 @@ TEST(SM50_device_plus_multiplies_dsrgemm_nt_n, 16x32x8_16x16x1_4x2_4x8_1x2) { using WarpShape = 
cutlass::gemm::GemmShape<16, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -290,9 +290,9 @@ TEST(SM50_device_plus_multiplies_dsrgemm_nt_n, 16x64x8_16x32x1_4x4_4x8_1x2) { using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -326,9 +326,9 @@ TEST(SM50_device_plus_multiplies_dsrgemm_nt_n, 16x128x8_16x64x1_4x8_4x8_1x2) { using WarpShape = cutlass::gemm::GemmShape<16, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -362,9 +362,9 @@ TEST(SM50_device_plus_multiplies_dsrgemm_nt_n, 32x32x8_32x16x1_4x4_8x4_1x2) { using WarpShape = cutlass::gemm::GemmShape<32, 16, 8>; using InstructionShape = 
cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -398,9 +398,9 @@ TEST(SM50_device_plus_multiplies_dsrgemm_nt_n, 32x64x8_32x32x1_8x4_4x8_1x2) { using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -434,9 +434,9 @@ TEST(SM50_device_plus_multiplies_dsrgemm_nt_n, 32x32x8_16x32x1_4x4_4x8_2x1) { using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -470,9 +470,9 @@ TEST(SM50_device_plus_multiplies_dsrgemm_nt_n, 64x32x8_32x32x1_8x4_4x8_2x1) { using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename 
cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -506,9 +506,9 @@ TEST(SM50_device_plus_multiplies_dsrgemm_nt_n, 16x32x8_8x16x1_2x2_4x8_2x2) { using WarpShape = cutlass::gemm::GemmShape<8, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -542,9 +542,9 @@ TEST(SM50_device_plus_multiplies_dsrgemm_nt_n, 16x64x8_8x32x1_2x4_4x8_2x2) { using WarpShape = cutlass::gemm::GemmShape<8, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -578,9 +578,9 @@ TEST(SM50_device_plus_multiplies_dsrgemm_nt_n, 32x32x8_16x16x1_4x2_4x8_2x2) { using WarpShape = cutlass::gemm::GemmShape<16, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, 
precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -614,9 +614,9 @@ TEST(SM50_device_plus_multiplies_dsrgemm_nt_n, 32x64x8_16x32x1_4x4_4x8_2x2) { using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -650,9 +650,9 @@ TEST(SM50_device_plus_multiplies_dsrgemm_nt_n, 32x128x8_16x64x1_4x8_4x8_2x2) { using WarpShape = cutlass::gemm::GemmShape<16, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -686,9 +686,9 @@ TEST(SM50_device_plus_multiplies_dsrgemm_nt_n, 64x32x8_32x16x1_4x4_8x4_2x2) { using WarpShape = cutlass::gemm::GemmShape<32, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, 
cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -722,9 +722,9 @@ TEST(SM50_device_plus_multiplies_dsrgemm_nt_n, 64x64x8_32x32x1_8x4_4x8_2x2) { using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -758,9 +758,9 @@ TEST(SM50_device_plus_multiplies_dsrgemm_nt_n, 128x32x8_64x16x1_8x4_8x4_2x2) { using WarpShape = cutlass::gemm::GemmShape<64, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -794,9 +794,9 @@ TEST(SM50_device_plus_multiplies_dsrgemm_nt_n, 16x64x16_8x16x1_2x2_4x8_2x4) { using WarpShape = cutlass::gemm::GemmShape<8, 16, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename 
cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -830,9 +830,9 @@ TEST(SM50_device_plus_multiplies_dsrgemm_nt_n, 16x128x16_8x32x1_2x4_4x8_2x4) { using WarpShape = cutlass::gemm::GemmShape<8, 32, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -866,9 +866,9 @@ TEST(SM50_device_plus_multiplies_dsrgemm_nt_n, 32x32x8_16x8x1_2x2_8x4_2x4) { using WarpShape = cutlass::gemm::GemmShape<16, 8, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -902,9 +902,9 @@ TEST(SM50_device_plus_multiplies_dsrgemm_nt_n, 32x64x8_16x16x1_4x2_4x8_2x4) { using WarpShape = cutlass::gemm::GemmShape<16, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, 
precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -938,9 +938,9 @@ TEST(SM50_device_plus_multiplies_dsrgemm_nt_n, 32x128x8_16x32x1_4x4_4x8_2x4) { using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -974,9 +974,9 @@ TEST(SM50_device_plus_multiplies_dsrgemm_nt_n, 64x64x8_32x16x1_4x4_8x4_2x4) { using WarpShape = cutlass::gemm::GemmShape<32, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1010,9 +1010,9 @@ TEST(SM50_device_plus_multiplies_dsrgemm_nt_n, 32x32x8_8x16x1_2x2_4x8_4x2) { using WarpShape = cutlass::gemm::GemmShape<8, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, 
OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1046,9 +1046,9 @@ TEST(SM50_device_plus_multiplies_dsrgemm_nt_n, 64x32x8_16x16x1_4x2_4x8_4x2) { using WarpShape = cutlass::gemm::GemmShape<16, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1082,9 +1082,9 @@ TEST(SM50_device_plus_multiplies_dsrgemm_nt_n, 64x64x8_16x32x1_4x4_4x8_4x2) { using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1118,9 +1118,9 @@ TEST(SM50_device_plus_multiplies_dsrgemm_nt_n, 128x32x8_32x16x1_4x4_8x4_4x2) { using WarpShape = cutlass::gemm::GemmShape<32, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using 
MultOp = Config::MultiplicationOp; @@ -1154,9 +1154,9 @@ TEST(SM50_device_plus_multiplies_dsrgemm_nt_n, 32x64x16_8x16x1_2x2_4x8_4x4) { using WarpShape = cutlass::gemm::GemmShape<8, 16, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1190,9 +1190,9 @@ TEST(SM50_device_plus_multiplies_dsrgemm_nt_n, 32x128x16_8x32x1_2x4_4x8_4x4) { using WarpShape = cutlass::gemm::GemmShape<8, 32, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1226,9 +1226,9 @@ TEST(SM50_device_plus_multiplies_dsrgemm_nt_n, 64x32x16_16x8x1_2x2_8x4_4x4) { using WarpShape = cutlass::gemm::GemmShape<16, 8, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1262,9 +1262,9 @@ 
TEST(SM50_device_plus_multiplies_dsrgemm_nt_n, 64x64x8_16x16x1_4x2_4x8_4x4) { using WarpShape = cutlass::gemm::GemmShape<16, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1298,9 +1298,9 @@ TEST(SM50_device_plus_multiplies_dsrgemm_nt_n, 128x32x16_32x8x1_4x2_8x4_4x4) { using WarpShape = cutlass::gemm::GemmShape<32, 8, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; diff --git a/test/device/sm50_simt_plus_multiplies_dsrgemm_nt_t.cu b/test/device/sm50_simt_plus_multiplies_dsrgemm_nt_t.cu index ddc481e..60d0393 100644 --- a/test/device/sm50_simt_plus_multiplies_dsrgemm_nt_t.cu +++ b/test/device/sm50_simt_plus_multiplies_dsrgemm_nt_t.cu @@ -38,9 +38,9 @@ TEST(SM50_device_plus_multiplies_dsrgemm_nt_t, 8x32x8_8x32x1_2x4_4x8_1x1) { using WarpShape = cutlass::gemm::GemmShape<8, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename 
cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -74,9 +74,9 @@ TEST(SM50_device_plus_multiplies_dsrgemm_nt_t, 16x32x8_16x32x1_4x4_4x8_1x1) { using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -110,9 +110,9 @@ TEST(SM50_device_plus_multiplies_dsrgemm_nt_t, 16x64x8_16x64x1_4x8_4x8_1x1) { using WarpShape = cutlass::gemm::GemmShape<16, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -146,9 +146,9 @@ TEST(SM50_device_plus_multiplies_dsrgemm_nt_t, 32x32x8_32x32x1_8x4_4x8_1x1) { using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, 
precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -182,9 +182,9 @@ TEST(SM50_device_plus_multiplies_dsrgemm_nt_t, 8x32x8_8x16x1_2x2_4x8_1x2) { using WarpShape = cutlass::gemm::GemmShape<8, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -218,9 +218,9 @@ TEST(SM50_device_plus_multiplies_dsrgemm_nt_t, 8x64x8_8x32x1_2x4_4x8_1x2) { using WarpShape = cutlass::gemm::GemmShape<8, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -254,9 +254,9 @@ TEST(SM50_device_plus_multiplies_dsrgemm_nt_t, 16x32x8_16x16x1_4x2_4x8_1x2) { using WarpShape = cutlass::gemm::GemmShape<16, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, 
OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -290,9 +290,9 @@ TEST(SM50_device_plus_multiplies_dsrgemm_nt_t, 16x64x8_16x32x1_4x4_4x8_1x2) { using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -326,9 +326,9 @@ TEST(SM50_device_plus_multiplies_dsrgemm_nt_t, 16x128x8_16x64x1_4x8_4x8_1x2) { using WarpShape = cutlass::gemm::GemmShape<16, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -362,9 +362,9 @@ TEST(SM50_device_plus_multiplies_dsrgemm_nt_t, 32x32x8_32x16x1_4x4_8x4_1x2) { using WarpShape = cutlass::gemm::GemmShape<32, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = 
Config::MultiplicationOp; @@ -398,9 +398,9 @@ TEST(SM50_device_plus_multiplies_dsrgemm_nt_t, 32x64x8_32x32x1_8x4_4x8_1x2) { using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -434,9 +434,9 @@ TEST(SM50_device_plus_multiplies_dsrgemm_nt_t, 32x32x8_16x32x1_4x4_4x8_2x1) { using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -470,9 +470,9 @@ TEST(SM50_device_plus_multiplies_dsrgemm_nt_t, 64x32x8_32x32x1_8x4_4x8_2x1) { using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -506,9 +506,9 @@ 
TEST(SM50_device_plus_multiplies_dsrgemm_nt_t, 16x32x8_8x16x1_2x2_4x8_2x2) { using WarpShape = cutlass::gemm::GemmShape<8, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -542,9 +542,9 @@ TEST(SM50_device_plus_multiplies_dsrgemm_nt_t, 16x64x8_8x32x1_2x4_4x8_2x2) { using WarpShape = cutlass::gemm::GemmShape<8, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -578,9 +578,9 @@ TEST(SM50_device_plus_multiplies_dsrgemm_nt_t, 32x32x8_16x16x1_4x2_4x8_2x2) { using WarpShape = cutlass::gemm::GemmShape<16, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -614,9 +614,9 @@ TEST(SM50_device_plus_multiplies_dsrgemm_nt_t, 
32x64x8_16x32x1_4x4_4x8_2x2) { using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -650,9 +650,9 @@ TEST(SM50_device_plus_multiplies_dsrgemm_nt_t, 32x128x8_16x64x1_4x8_4x8_2x2) { using WarpShape = cutlass::gemm::GemmShape<16, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -686,9 +686,9 @@ TEST(SM50_device_plus_multiplies_dsrgemm_nt_t, 64x32x8_32x16x1_4x4_8x4_2x2) { using WarpShape = cutlass::gemm::GemmShape<32, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -722,9 +722,9 @@ TEST(SM50_device_plus_multiplies_dsrgemm_nt_t, 64x64x8_32x32x1_8x4_4x8_2x2) { using WarpShape = 
cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -758,9 +758,9 @@ TEST(SM50_device_plus_multiplies_dsrgemm_nt_t, 128x32x8_64x16x1_8x4_8x4_2x2) { using WarpShape = cutlass::gemm::GemmShape<64, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -794,9 +794,9 @@ TEST(SM50_device_plus_multiplies_dsrgemm_nt_t, 16x64x16_8x16x1_2x2_4x8_2x4) { using WarpShape = cutlass::gemm::GemmShape<8, 16, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -830,9 +830,9 @@ TEST(SM50_device_plus_multiplies_dsrgemm_nt_t, 16x128x16_8x32x1_2x4_4x8_2x4) { using WarpShape = cutlass::gemm::GemmShape<8, 32, 16>; using InstructionShape = 
cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -866,9 +866,9 @@ TEST(SM50_device_plus_multiplies_dsrgemm_nt_t, 32x32x8_16x8x1_2x2_8x4_2x4) { using WarpShape = cutlass::gemm::GemmShape<16, 8, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -902,9 +902,9 @@ TEST(SM50_device_plus_multiplies_dsrgemm_nt_t, 32x64x8_16x16x1_4x2_4x8_2x4) { using WarpShape = cutlass::gemm::GemmShape<16, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -938,9 +938,9 @@ TEST(SM50_device_plus_multiplies_dsrgemm_nt_t, 32x128x8_16x32x1_4x4_4x8_2x4) { using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename 
cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -974,9 +974,9 @@ TEST(SM50_device_plus_multiplies_dsrgemm_nt_t, 64x64x8_32x16x1_4x4_8x4_2x4) { using WarpShape = cutlass::gemm::GemmShape<32, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1010,9 +1010,9 @@ TEST(SM50_device_plus_multiplies_dsrgemm_nt_t, 32x32x8_8x16x1_2x2_4x8_4x2) { using WarpShape = cutlass::gemm::GemmShape<8, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1046,9 +1046,9 @@ TEST(SM50_device_plus_multiplies_dsrgemm_nt_t, 64x32x8_16x16x1_4x2_4x8_4x2) { using WarpShape = cutlass::gemm::GemmShape<16, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - 
precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1082,9 +1082,9 @@ TEST(SM50_device_plus_multiplies_dsrgemm_nt_t, 64x64x8_16x32x1_4x4_4x8_4x2) { using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1118,9 +1118,9 @@ TEST(SM50_device_plus_multiplies_dsrgemm_nt_t, 128x32x8_32x16x1_4x4_8x4_4x2) { using WarpShape = cutlass::gemm::GemmShape<32, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1154,9 +1154,9 @@ TEST(SM50_device_plus_multiplies_dsrgemm_nt_t, 32x64x16_8x16x1_2x2_4x8_4x4) { using WarpShape = cutlass::gemm::GemmShape<8, 16, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - 
cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1190,9 +1190,9 @@ TEST(SM50_device_plus_multiplies_dsrgemm_nt_t, 32x128x16_8x32x1_2x4_4x8_4x4) { using WarpShape = cutlass::gemm::GemmShape<8, 32, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1226,9 +1226,9 @@ TEST(SM50_device_plus_multiplies_dsrgemm_nt_t, 64x32x16_16x8x1_2x2_8x4_4x4) { using WarpShape = cutlass::gemm::GemmShape<16, 8, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1262,9 +1262,9 @@ TEST(SM50_device_plus_multiplies_dsrgemm_nt_t, 64x64x8_16x16x1_4x2_4x8_4x4) { using WarpShape = cutlass::gemm::GemmShape<16, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = 
typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1298,9 +1298,9 @@ TEST(SM50_device_plus_multiplies_dsrgemm_nt_t, 128x32x16_32x8x1_4x2_8x4_4x4) { using WarpShape = cutlass::gemm::GemmShape<32, 8, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; diff --git a/test/device/sm50_simt_plus_multiplies_dsrgemm_tn_n.cu b/test/device/sm50_simt_plus_multiplies_dsrgemm_tn_n.cu index 0ac35ad..627154a 100644 --- a/test/device/sm50_simt_plus_multiplies_dsrgemm_tn_n.cu +++ b/test/device/sm50_simt_plus_multiplies_dsrgemm_tn_n.cu @@ -38,9 +38,9 @@ TEST(SM50_device_plus_multiplies_dsrgemm_tn_n, 8x32x8_8x32x1_2x4_4x8_1x1) { using WarpShape = cutlass::gemm::GemmShape<8, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -74,9 +74,9 @@ TEST(SM50_device_plus_multiplies_dsrgemm_tn_n, 16x32x8_16x32x1_4x4_4x8_1x1) { using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 
1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -110,9 +110,9 @@ TEST(SM50_device_plus_multiplies_dsrgemm_tn_n, 16x64x8_16x64x1_4x8_4x8_1x1) { using WarpShape = cutlass::gemm::GemmShape<16, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -146,9 +146,9 @@ TEST(SM50_device_plus_multiplies_dsrgemm_tn_n, 32x32x8_32x32x1_8x4_4x8_1x1) { using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -182,9 +182,9 @@ TEST(SM50_device_plus_multiplies_dsrgemm_tn_n, 8x32x8_8x16x1_2x2_4x8_1x2) { using WarpShape = cutlass::gemm::GemmShape<8, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename 
cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -218,9 +218,9 @@ TEST(SM50_device_plus_multiplies_dsrgemm_tn_n, 8x64x8_8x32x1_2x4_4x8_1x2) { using WarpShape = cutlass::gemm::GemmShape<8, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -254,9 +254,9 @@ TEST(SM50_device_plus_multiplies_dsrgemm_tn_n, 16x32x8_16x16x1_4x2_4x8_1x2) { using WarpShape = cutlass::gemm::GemmShape<16, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -290,9 +290,9 @@ TEST(SM50_device_plus_multiplies_dsrgemm_tn_n, 16x64x8_16x32x1_4x4_4x8_1x2) { using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, 
precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -326,9 +326,9 @@ TEST(SM50_device_plus_multiplies_dsrgemm_tn_n, 16x128x8_16x64x1_4x8_4x8_1x2) { using WarpShape = cutlass::gemm::GemmShape<16, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -362,9 +362,9 @@ TEST(SM50_device_plus_multiplies_dsrgemm_tn_n, 32x32x8_32x16x1_4x4_8x4_1x2) { using WarpShape = cutlass::gemm::GemmShape<32, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -398,9 +398,9 @@ TEST(SM50_device_plus_multiplies_dsrgemm_tn_n, 32x64x8_32x32x1_8x4_4x8_1x2) { using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, 
cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -434,9 +434,9 @@ TEST(SM50_device_plus_multiplies_dsrgemm_tn_n, 32x32x8_16x32x1_4x4_4x8_2x1) { using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -470,9 +470,9 @@ TEST(SM50_device_plus_multiplies_dsrgemm_tn_n, 64x32x8_32x32x1_8x4_4x8_2x1) { using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -506,9 +506,9 @@ TEST(SM50_device_plus_multiplies_dsrgemm_tn_n, 16x32x8_8x16x1_2x2_4x8_2x2) { using WarpShape = cutlass::gemm::GemmShape<8, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename 
cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -542,9 +542,9 @@ TEST(SM50_device_plus_multiplies_dsrgemm_tn_n, 16x64x8_8x32x1_2x4_4x8_2x2) { using WarpShape = cutlass::gemm::GemmShape<8, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -578,9 +578,9 @@ TEST(SM50_device_plus_multiplies_dsrgemm_tn_n, 32x32x8_16x16x1_4x2_4x8_2x2) { using WarpShape = cutlass::gemm::GemmShape<16, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -614,9 +614,9 @@ TEST(SM50_device_plus_multiplies_dsrgemm_tn_n, 32x64x8_16x32x1_4x4_4x8_2x2) { using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, 
precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -650,9 +650,9 @@ TEST(SM50_device_plus_multiplies_dsrgemm_tn_n, 32x128x8_16x64x1_4x8_4x8_2x2) { using WarpShape = cutlass::gemm::GemmShape<16, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -686,9 +686,9 @@ TEST(SM50_device_plus_multiplies_dsrgemm_tn_n, 64x32x8_32x16x1_4x4_8x4_2x2) { using WarpShape = cutlass::gemm::GemmShape<32, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -722,9 +722,9 @@ TEST(SM50_device_plus_multiplies_dsrgemm_tn_n, 64x64x8_32x32x1_8x4_4x8_2x2) { using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, 
OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -758,9 +758,9 @@ TEST(SM50_device_plus_multiplies_dsrgemm_tn_n, 128x32x8_64x16x1_8x4_8x4_2x2) { using WarpShape = cutlass::gemm::GemmShape<64, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -794,9 +794,9 @@ TEST(SM50_device_plus_multiplies_dsrgemm_tn_n, 16x64x16_8x16x1_2x2_4x8_2x4) { using WarpShape = cutlass::gemm::GemmShape<8, 16, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -830,9 +830,9 @@ TEST(SM50_device_plus_multiplies_dsrgemm_tn_n, 16x128x16_8x32x1_2x4_4x8_2x4) { using WarpShape = cutlass::gemm::GemmShape<8, 32, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp 
= Config::MultiplicationOp; @@ -866,9 +866,9 @@ TEST(SM50_device_plus_multiplies_dsrgemm_tn_n, 32x32x8_16x8x1_2x2_8x4_2x4) { using WarpShape = cutlass::gemm::GemmShape<16, 8, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -902,9 +902,9 @@ TEST(SM50_device_plus_multiplies_dsrgemm_tn_n, 32x64x8_16x16x1_4x2_4x8_2x4) { using WarpShape = cutlass::gemm::GemmShape<16, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -938,9 +938,9 @@ TEST(SM50_device_plus_multiplies_dsrgemm_tn_n, 32x128x8_16x32x1_4x4_4x8_2x4) { using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -974,9 +974,9 @@ 
TEST(SM50_device_plus_multiplies_dsrgemm_tn_n, 64x64x8_32x16x1_4x4_8x4_2x4) { using WarpShape = cutlass::gemm::GemmShape<32, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1010,9 +1010,9 @@ TEST(SM50_device_plus_multiplies_dsrgemm_tn_n, 32x32x8_8x16x1_2x2_4x8_4x2) { using WarpShape = cutlass::gemm::GemmShape<8, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1046,9 +1046,9 @@ TEST(SM50_device_plus_multiplies_dsrgemm_tn_n, 64x32x8_16x16x1_4x2_4x8_4x2) { using WarpShape = cutlass::gemm::GemmShape<16, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1082,9 +1082,9 @@ TEST(SM50_device_plus_multiplies_dsrgemm_tn_n, 
64x64x8_16x32x1_4x4_4x8_4x2) { using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1118,9 +1118,9 @@ TEST(SM50_device_plus_multiplies_dsrgemm_tn_n, 128x32x8_32x16x1_4x4_8x4_4x2) { using WarpShape = cutlass::gemm::GemmShape<32, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1154,9 +1154,9 @@ TEST(SM50_device_plus_multiplies_dsrgemm_tn_n, 32x64x16_8x16x1_2x2_4x8_4x4) { using WarpShape = cutlass::gemm::GemmShape<8, 16, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1190,9 +1190,9 @@ TEST(SM50_device_plus_multiplies_dsrgemm_tn_n, 32x128x16_8x32x1_2x4_4x8_4x4) { using WarpShape = 
cutlass::gemm::GemmShape<8, 32, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1226,9 +1226,9 @@ TEST(SM50_device_plus_multiplies_dsrgemm_tn_n, 64x32x16_16x8x1_2x2_8x4_4x4) { using WarpShape = cutlass::gemm::GemmShape<16, 8, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1262,9 +1262,9 @@ TEST(SM50_device_plus_multiplies_dsrgemm_tn_n, 64x64x8_16x16x1_4x2_4x8_4x4) { using WarpShape = cutlass::gemm::GemmShape<16, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1298,9 +1298,9 @@ TEST(SM50_device_plus_multiplies_dsrgemm_tn_n, 128x32x16_32x8x1_4x2_8x4_4x4) { using WarpShape = cutlass::gemm::GemmShape<32, 8, 16>; using InstructionShape 
= cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; diff --git a/test/device/sm50_simt_plus_multiplies_dsrgemm_tn_t.cu b/test/device/sm50_simt_plus_multiplies_dsrgemm_tn_t.cu index bbd7618..21363d0 100644 --- a/test/device/sm50_simt_plus_multiplies_dsrgemm_tn_t.cu +++ b/test/device/sm50_simt_plus_multiplies_dsrgemm_tn_t.cu @@ -38,9 +38,9 @@ TEST(SM50_device_plus_multiplies_dsrgemm_tn_t, 8x32x8_8x32x1_2x4_4x8_1x1) { using WarpShape = cutlass::gemm::GemmShape<8, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -74,9 +74,9 @@ TEST(SM50_device_plus_multiplies_dsrgemm_tn_t, 16x32x8_16x32x1_4x4_4x8_1x1) { using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = 
Config::MultiplicationOp; @@ -110,9 +110,9 @@ TEST(SM50_device_plus_multiplies_dsrgemm_tn_t, 16x64x8_16x64x1_4x8_4x8_1x1) { using WarpShape = cutlass::gemm::GemmShape<16, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -146,9 +146,9 @@ TEST(SM50_device_plus_multiplies_dsrgemm_tn_t, 32x32x8_32x32x1_8x4_4x8_1x1) { using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -182,9 +182,9 @@ TEST(SM50_device_plus_multiplies_dsrgemm_tn_t, 8x32x8_8x16x1_2x2_4x8_1x2) { using WarpShape = cutlass::gemm::GemmShape<8, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -218,9 +218,9 @@ 
TEST(SM50_device_plus_multiplies_dsrgemm_tn_t, 8x64x8_8x32x1_2x4_4x8_1x2) { using WarpShape = cutlass::gemm::GemmShape<8, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -254,9 +254,9 @@ TEST(SM50_device_plus_multiplies_dsrgemm_tn_t, 16x32x8_16x16x1_4x2_4x8_1x2) { using WarpShape = cutlass::gemm::GemmShape<16, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -290,9 +290,9 @@ TEST(SM50_device_plus_multiplies_dsrgemm_tn_t, 16x64x8_16x32x1_4x4_4x8_1x2) { using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -326,9 +326,9 @@ TEST(SM50_device_plus_multiplies_dsrgemm_tn_t, 
16x128x8_16x64x1_4x8_4x8_1x2) { using WarpShape = cutlass::gemm::GemmShape<16, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -362,9 +362,9 @@ TEST(SM50_device_plus_multiplies_dsrgemm_tn_t, 32x32x8_32x16x1_4x4_8x4_1x2) { using WarpShape = cutlass::gemm::GemmShape<32, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -398,9 +398,9 @@ TEST(SM50_device_plus_multiplies_dsrgemm_tn_t, 32x64x8_32x32x1_8x4_4x8_1x2) { using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -434,9 +434,9 @@ TEST(SM50_device_plus_multiplies_dsrgemm_tn_t, 32x32x8_16x32x1_4x4_4x8_2x1) { using WarpShape = 
cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -470,9 +470,9 @@ TEST(SM50_device_plus_multiplies_dsrgemm_tn_t, 64x32x8_32x32x1_8x4_4x8_2x1) { using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -506,9 +506,9 @@ TEST(SM50_device_plus_multiplies_dsrgemm_tn_t, 16x32x8_8x16x1_2x2_4x8_2x2) { using WarpShape = cutlass::gemm::GemmShape<8, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -542,9 +542,9 @@ TEST(SM50_device_plus_multiplies_dsrgemm_tn_t, 16x64x8_8x32x1_2x4_4x8_2x2) { using WarpShape = cutlass::gemm::GemmShape<8, 32, 8>; using InstructionShape = 
cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -578,9 +578,9 @@ TEST(SM50_device_plus_multiplies_dsrgemm_tn_t, 32x32x8_16x16x1_4x2_4x8_2x2) { using WarpShape = cutlass::gemm::GemmShape<16, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -614,9 +614,9 @@ TEST(SM50_device_plus_multiplies_dsrgemm_tn_t, 32x64x8_16x32x1_4x4_4x8_2x2) { using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -650,9 +650,9 @@ TEST(SM50_device_plus_multiplies_dsrgemm_tn_t, 32x128x8_16x64x1_4x8_4x8_2x2) { using WarpShape = cutlass::gemm::GemmShape<16, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename 
cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -686,9 +686,9 @@ TEST(SM50_device_plus_multiplies_dsrgemm_tn_t, 64x32x8_32x16x1_4x4_8x4_2x2) { using WarpShape = cutlass::gemm::GemmShape<32, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -722,9 +722,9 @@ TEST(SM50_device_plus_multiplies_dsrgemm_tn_t, 64x64x8_32x32x1_8x4_4x8_2x2) { using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -758,9 +758,9 @@ TEST(SM50_device_plus_multiplies_dsrgemm_tn_t, 128x32x8_64x16x1_8x4_8x4_2x2) { using WarpShape = cutlass::gemm::GemmShape<64, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, 
precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -794,9 +794,9 @@ TEST(SM50_device_plus_multiplies_dsrgemm_tn_t, 16x64x16_8x16x1_2x2_4x8_2x4) { using WarpShape = cutlass::gemm::GemmShape<8, 16, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -830,9 +830,9 @@ TEST(SM50_device_plus_multiplies_dsrgemm_tn_t, 16x128x16_8x32x1_2x4_4x8_2x4) { using WarpShape = cutlass::gemm::GemmShape<8, 32, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -866,9 +866,9 @@ TEST(SM50_device_plus_multiplies_dsrgemm_tn_t, 32x32x8_16x8x1_2x2_8x4_2x4) { using WarpShape = cutlass::gemm::GemmShape<16, 8, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, 
cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -902,9 +902,9 @@ TEST(SM50_device_plus_multiplies_dsrgemm_tn_t, 32x64x8_16x16x1_4x2_4x8_2x4) { using WarpShape = cutlass::gemm::GemmShape<16, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -938,9 +938,9 @@ TEST(SM50_device_plus_multiplies_dsrgemm_tn_t, 32x128x8_16x32x1_4x4_4x8_2x4) { using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -974,9 +974,9 @@ TEST(SM50_device_plus_multiplies_dsrgemm_tn_t, 64x64x8_32x16x1_4x4_8x4_2x4) { using WarpShape = cutlass::gemm::GemmShape<32, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename 
cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1010,9 +1010,9 @@ TEST(SM50_device_plus_multiplies_dsrgemm_tn_t, 32x32x8_8x16x1_2x2_4x8_4x2) { using WarpShape = cutlass::gemm::GemmShape<8, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1046,9 +1046,9 @@ TEST(SM50_device_plus_multiplies_dsrgemm_tn_t, 64x32x8_16x16x1_4x2_4x8_4x2) { using WarpShape = cutlass::gemm::GemmShape<16, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1082,9 +1082,9 @@ TEST(SM50_device_plus_multiplies_dsrgemm_tn_t, 64x64x8_16x32x1_4x4_4x8_4x2) { using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, 
precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1118,9 +1118,9 @@ TEST(SM50_device_plus_multiplies_dsrgemm_tn_t, 128x32x8_32x16x1_4x4_8x4_4x2) { using WarpShape = cutlass::gemm::GemmShape<32, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1154,9 +1154,9 @@ TEST(SM50_device_plus_multiplies_dsrgemm_tn_t, 32x64x16_8x16x1_2x2_4x8_4x4) { using WarpShape = cutlass::gemm::GemmShape<8, 16, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1190,9 +1190,9 @@ TEST(SM50_device_plus_multiplies_dsrgemm_tn_t, 32x128x16_8x32x1_2x4_4x8_4x4) { using WarpShape = cutlass::gemm::GemmShape<8, 32, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, 
cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1226,9 +1226,9 @@ TEST(SM50_device_plus_multiplies_dsrgemm_tn_t, 64x32x16_16x8x1_2x2_8x4_4x4) { using WarpShape = cutlass::gemm::GemmShape<16, 8, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1262,9 +1262,9 @@ TEST(SM50_device_plus_multiplies_dsrgemm_tn_t, 64x64x8_16x16x1_4x2_4x8_4x4) { using WarpShape = cutlass::gemm::GemmShape<16, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1298,9 +1298,9 @@ TEST(SM50_device_plus_multiplies_dsrgemm_tn_t, 128x32x16_32x8x1_4x2_8x4_4x4) { using WarpShape = cutlass::gemm::GemmShape<32, 8, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = 
Config::AdditionOp; using MultOp = Config::MultiplicationOp; diff --git a/test/device/sm50_simt_plus_multiplies_dsrgemm_tt_n.cu b/test/device/sm50_simt_plus_multiplies_dsrgemm_tt_n.cu index f92a16c..adb0a86 100644 --- a/test/device/sm50_simt_plus_multiplies_dsrgemm_tt_n.cu +++ b/test/device/sm50_simt_plus_multiplies_dsrgemm_tt_n.cu @@ -38,9 +38,9 @@ TEST(SM50_device_plus_multiplies_dsrgemm_tt_n, 8x32x8_8x32x1_2x4_4x8_1x1) { using WarpShape = cutlass::gemm::GemmShape<8, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -74,9 +74,9 @@ TEST(SM50_device_plus_multiplies_dsrgemm_tt_n, 16x32x8_16x32x1_4x4_4x8_1x1) { using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -110,9 +110,9 @@ TEST(SM50_device_plus_multiplies_dsrgemm_tt_n, 16x64x8_16x64x1_4x8_4x8_1x1) { using WarpShape = cutlass::gemm::GemmShape<16, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, 
SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -146,9 +146,9 @@ TEST(SM50_device_plus_multiplies_dsrgemm_tt_n, 32x32x8_32x32x1_8x4_4x8_1x1) { using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -182,9 +182,9 @@ TEST(SM50_device_plus_multiplies_dsrgemm_tt_n, 8x32x8_8x16x1_2x2_4x8_1x2) { using WarpShape = cutlass::gemm::GemmShape<8, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -218,9 +218,9 @@ TEST(SM50_device_plus_multiplies_dsrgemm_tt_n, 8x64x8_8x32x1_2x4_4x8_1x2) { using WarpShape = cutlass::gemm::GemmShape<8, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename 
cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -254,9 +254,9 @@ TEST(SM50_device_plus_multiplies_dsrgemm_tt_n, 16x32x8_16x16x1_4x2_4x8_1x2) { using WarpShape = cutlass::gemm::GemmShape<16, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -290,9 +290,9 @@ TEST(SM50_device_plus_multiplies_dsrgemm_tt_n, 16x64x8_16x32x1_4x4_4x8_1x2) { using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -326,9 +326,9 @@ TEST(SM50_device_plus_multiplies_dsrgemm_tt_n, 16x128x8_16x64x1_4x8_4x8_1x2) { using WarpShape = cutlass::gemm::GemmShape<16, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, 
precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -362,9 +362,9 @@ TEST(SM50_device_plus_multiplies_dsrgemm_tt_n, 32x32x8_32x16x1_4x4_8x4_1x2) { using WarpShape = cutlass::gemm::GemmShape<32, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -398,9 +398,9 @@ TEST(SM50_device_plus_multiplies_dsrgemm_tt_n, 32x64x8_32x32x1_8x4_4x8_1x2) { using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -434,9 +434,9 @@ TEST(SM50_device_plus_multiplies_dsrgemm_tt_n, 32x32x8_16x32x1_4x4_4x8_2x1) { using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, 
OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -470,9 +470,9 @@ TEST(SM50_device_plus_multiplies_dsrgemm_tt_n, 64x32x8_32x32x1_8x4_4x8_2x1) { using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -506,9 +506,9 @@ TEST(SM50_device_plus_multiplies_dsrgemm_tt_n, 16x32x8_8x16x1_2x2_4x8_2x2) { using WarpShape = cutlass::gemm::GemmShape<8, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -542,9 +542,9 @@ TEST(SM50_device_plus_multiplies_dsrgemm_tt_n, 16x64x8_8x32x1_2x4_4x8_2x2) { using WarpShape = cutlass::gemm::GemmShape<8, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = 
Config::MultiplicationOp; @@ -578,9 +578,9 @@ TEST(SM50_device_plus_multiplies_dsrgemm_tt_n, 32x32x8_16x16x1_4x2_4x8_2x2) { using WarpShape = cutlass::gemm::GemmShape<16, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -614,9 +614,9 @@ TEST(SM50_device_plus_multiplies_dsrgemm_tt_n, 32x64x8_16x32x1_4x4_4x8_2x2) { using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -650,9 +650,9 @@ TEST(SM50_device_plus_multiplies_dsrgemm_tt_n, 32x128x8_16x64x1_4x8_4x8_2x2) { using WarpShape = cutlass::gemm::GemmShape<16, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -686,9 +686,9 @@ 
TEST(SM50_device_plus_multiplies_dsrgemm_tt_n, 64x32x8_32x16x1_4x4_8x4_2x2) { using WarpShape = cutlass::gemm::GemmShape<32, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -722,9 +722,9 @@ TEST(SM50_device_plus_multiplies_dsrgemm_tt_n, 64x64x8_32x32x1_8x4_4x8_2x2) { using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -758,9 +758,9 @@ TEST(SM50_device_plus_multiplies_dsrgemm_tt_n, 128x32x8_64x16x1_8x4_8x4_2x2) { using WarpShape = cutlass::gemm::GemmShape<64, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -794,9 +794,9 @@ TEST(SM50_device_plus_multiplies_dsrgemm_tt_n, 
16x64x16_8x16x1_2x2_4x8_2x4) { using WarpShape = cutlass::gemm::GemmShape<8, 16, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -830,9 +830,9 @@ TEST(SM50_device_plus_multiplies_dsrgemm_tt_n, 16x128x16_8x32x1_2x4_4x8_2x4) { using WarpShape = cutlass::gemm::GemmShape<8, 32, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -866,9 +866,9 @@ TEST(SM50_device_plus_multiplies_dsrgemm_tt_n, 32x32x8_16x8x1_2x2_8x4_2x4) { using WarpShape = cutlass::gemm::GemmShape<16, 8, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -902,9 +902,9 @@ TEST(SM50_device_plus_multiplies_dsrgemm_tt_n, 32x64x8_16x16x1_4x2_4x8_2x4) { using WarpShape = 
cutlass::gemm::GemmShape<16, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -938,9 +938,9 @@ TEST(SM50_device_plus_multiplies_dsrgemm_tt_n, 32x128x8_16x32x1_4x4_4x8_2x4) { using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -974,9 +974,9 @@ TEST(SM50_device_plus_multiplies_dsrgemm_tt_n, 64x64x8_32x16x1_4x4_8x4_2x4) { using WarpShape = cutlass::gemm::GemmShape<32, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1010,9 +1010,9 @@ TEST(SM50_device_plus_multiplies_dsrgemm_tt_n, 32x32x8_8x16x1_2x2_4x8_4x2) { using WarpShape = cutlass::gemm::GemmShape<8, 16, 8>; using InstructionShape = 
cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1046,9 +1046,9 @@ TEST(SM50_device_plus_multiplies_dsrgemm_tt_n, 64x32x8_16x16x1_4x2_4x8_4x2) { using WarpShape = cutlass::gemm::GemmShape<16, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1082,9 +1082,9 @@ TEST(SM50_device_plus_multiplies_dsrgemm_tt_n, 64x64x8_16x32x1_4x4_4x8_4x2) { using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1118,9 +1118,9 @@ TEST(SM50_device_plus_multiplies_dsrgemm_tt_n, 128x32x8_32x16x1_4x4_8x4_4x2) { using WarpShape = cutlass::gemm::GemmShape<32, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename 
cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1154,9 +1154,9 @@ TEST(SM50_device_plus_multiplies_dsrgemm_tt_n, 32x64x16_8x16x1_2x2_4x8_4x4) { using WarpShape = cutlass::gemm::GemmShape<8, 16, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1190,9 +1190,9 @@ TEST(SM50_device_plus_multiplies_dsrgemm_tt_n, 32x128x16_8x32x1_2x4_4x8_4x4) { using WarpShape = cutlass::gemm::GemmShape<8, 32, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1226,9 +1226,9 @@ TEST(SM50_device_plus_multiplies_dsrgemm_tt_n, 64x32x16_16x8x1_2x2_8x4_4x4) { using WarpShape = cutlass::gemm::GemmShape<16, 8, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - 
precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1262,9 +1262,9 @@ TEST(SM50_device_plus_multiplies_dsrgemm_tt_n, 64x64x8_16x16x1_4x2_4x8_4x4) { using WarpShape = cutlass::gemm::GemmShape<16, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1298,9 +1298,9 @@ TEST(SM50_device_plus_multiplies_dsrgemm_tt_n, 128x32x16_32x8x1_4x2_8x4_4x4) { using WarpShape = cutlass::gemm::GemmShape<32, 8, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; diff --git a/test/device/sm50_simt_plus_multiplies_dsrgemm_tt_t.cu b/test/device/sm50_simt_plus_multiplies_dsrgemm_tt_t.cu index 70987c3..8989798 100644 --- a/test/device/sm50_simt_plus_multiplies_dsrgemm_tt_t.cu +++ b/test/device/sm50_simt_plus_multiplies_dsrgemm_tt_t.cu @@ -38,9 +38,9 @@ TEST(SM50_device_plus_multiplies_dsrgemm_tt_t, 
8x32x8_8x32x1_2x4_4x8_1x1) { using WarpShape = cutlass::gemm::GemmShape<8, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -74,9 +74,9 @@ TEST(SM50_device_plus_multiplies_dsrgemm_tt_t, 16x32x8_16x32x1_4x4_4x8_1x1) { using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -110,9 +110,9 @@ TEST(SM50_device_plus_multiplies_dsrgemm_tt_t, 16x64x8_16x64x1_4x8_4x8_1x1) { using WarpShape = cutlass::gemm::GemmShape<16, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -146,9 +146,9 @@ TEST(SM50_device_plus_multiplies_dsrgemm_tt_t, 32x32x8_32x32x1_8x4_4x8_1x1) { using WarpShape = 
cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -182,9 +182,9 @@ TEST(SM50_device_plus_multiplies_dsrgemm_tt_t, 8x32x8_8x16x1_2x2_4x8_1x2) { using WarpShape = cutlass::gemm::GemmShape<8, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -218,9 +218,9 @@ TEST(SM50_device_plus_multiplies_dsrgemm_tt_t, 8x64x8_8x32x1_2x4_4x8_1x2) { using WarpShape = cutlass::gemm::GemmShape<8, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -254,9 +254,9 @@ TEST(SM50_device_plus_multiplies_dsrgemm_tt_t, 16x32x8_16x16x1_4x2_4x8_1x2) { using WarpShape = cutlass::gemm::GemmShape<16, 16, 8>; using InstructionShape = 
cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -290,9 +290,9 @@ TEST(SM50_device_plus_multiplies_dsrgemm_tt_t, 16x64x8_16x32x1_4x4_4x8_1x2) { using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -326,9 +326,9 @@ TEST(SM50_device_plus_multiplies_dsrgemm_tt_t, 16x128x8_16x64x1_4x8_4x8_1x2) { using WarpShape = cutlass::gemm::GemmShape<16, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -362,9 +362,9 @@ TEST(SM50_device_plus_multiplies_dsrgemm_tt_t, 32x32x8_32x16x1_4x4_8x4_1x2) { using WarpShape = cutlass::gemm::GemmShape<32, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename 
cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -398,9 +398,9 @@ TEST(SM50_device_plus_multiplies_dsrgemm_tt_t, 32x64x8_32x32x1_8x4_4x8_1x2) { using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -434,9 +434,9 @@ TEST(SM50_device_plus_multiplies_dsrgemm_tt_t, 32x32x8_16x32x1_4x4_4x8_2x1) { using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -470,9 +470,9 @@ TEST(SM50_device_plus_multiplies_dsrgemm_tt_t, 64x32x8_32x32x1_8x4_4x8_2x1) { using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, 
precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -506,9 +506,9 @@ TEST(SM50_device_plus_multiplies_dsrgemm_tt_t, 16x32x8_8x16x1_2x2_4x8_2x2) { using WarpShape = cutlass::gemm::GemmShape<8, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -542,9 +542,9 @@ TEST(SM50_device_plus_multiplies_dsrgemm_tt_t, 16x64x8_8x32x1_2x4_4x8_2x2) { using WarpShape = cutlass::gemm::GemmShape<8, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -578,9 +578,9 @@ TEST(SM50_device_plus_multiplies_dsrgemm_tt_t, 32x32x8_16x16x1_4x2_4x8_2x2) { using WarpShape = cutlass::gemm::GemmShape<16, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, 
cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -614,9 +614,9 @@ TEST(SM50_device_plus_multiplies_dsrgemm_tt_t, 32x64x8_16x32x1_4x4_4x8_2x2) { using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -650,9 +650,9 @@ TEST(SM50_device_plus_multiplies_dsrgemm_tt_t, 32x128x8_16x64x1_4x8_4x8_2x2) { using WarpShape = cutlass::gemm::GemmShape<16, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -686,9 +686,9 @@ TEST(SM50_device_plus_multiplies_dsrgemm_tt_t, 64x32x8_32x16x1_4x4_8x4_2x2) { using WarpShape = cutlass::gemm::GemmShape<32, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename 
cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -722,9 +722,9 @@ TEST(SM50_device_plus_multiplies_dsrgemm_tt_t, 64x64x8_32x32x1_8x4_4x8_2x2) { using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -758,9 +758,9 @@ TEST(SM50_device_plus_multiplies_dsrgemm_tt_t, 128x32x8_64x16x1_8x4_8x4_2x2) { using WarpShape = cutlass::gemm::GemmShape<64, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -794,9 +794,9 @@ TEST(SM50_device_plus_multiplies_dsrgemm_tt_t, 16x64x16_8x16x1_2x2_4x8_2x4) { using WarpShape = cutlass::gemm::GemmShape<8, 16, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, 
precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -830,9 +830,9 @@ TEST(SM50_device_plus_multiplies_dsrgemm_tt_t, 16x128x16_8x32x1_2x4_4x8_2x4) { using WarpShape = cutlass::gemm::GemmShape<8, 32, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -866,9 +866,9 @@ TEST(SM50_device_plus_multiplies_dsrgemm_tt_t, 32x32x8_16x8x1_2x2_8x4_2x4) { using WarpShape = cutlass::gemm::GemmShape<16, 8, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -902,9 +902,9 @@ TEST(SM50_device_plus_multiplies_dsrgemm_tt_t, 32x64x8_16x16x1_4x2_4x8_2x4) { using WarpShape = cutlass::gemm::GemmShape<16, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, 
OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -938,9 +938,9 @@ TEST(SM50_device_plus_multiplies_dsrgemm_tt_t, 32x128x8_16x32x1_4x4_4x8_2x4) { using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -974,9 +974,9 @@ TEST(SM50_device_plus_multiplies_dsrgemm_tt_t, 64x64x8_32x16x1_4x4_8x4_2x4) { using WarpShape = cutlass::gemm::GemmShape<32, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1010,9 +1010,9 @@ TEST(SM50_device_plus_multiplies_dsrgemm_tt_t, 32x32x8_8x16x1_2x2_4x8_4x2) { using WarpShape = cutlass::gemm::GemmShape<8, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = 
Config::MultiplicationOp; @@ -1046,9 +1046,9 @@ TEST(SM50_device_plus_multiplies_dsrgemm_tt_t, 64x32x8_16x16x1_4x2_4x8_4x2) { using WarpShape = cutlass::gemm::GemmShape<16, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1082,9 +1082,9 @@ TEST(SM50_device_plus_multiplies_dsrgemm_tt_t, 64x64x8_16x32x1_4x4_4x8_4x2) { using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1118,9 +1118,9 @@ TEST(SM50_device_plus_multiplies_dsrgemm_tt_t, 128x32x8_32x16x1_4x4_8x4_4x2) { using WarpShape = cutlass::gemm::GemmShape<32, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1154,9 +1154,9 @@ 
TEST(SM50_device_plus_multiplies_dsrgemm_tt_t, 32x64x16_8x16x1_2x2_4x8_4x4) { using WarpShape = cutlass::gemm::GemmShape<8, 16, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1190,9 +1190,9 @@ TEST(SM50_device_plus_multiplies_dsrgemm_tt_t, 32x128x16_8x32x1_2x4_4x8_4x4) { using WarpShape = cutlass::gemm::GemmShape<8, 32, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1226,9 +1226,9 @@ TEST(SM50_device_plus_multiplies_dsrgemm_tt_t, 64x32x16_16x8x1_2x2_8x4_4x4) { using WarpShape = cutlass::gemm::GemmShape<16, 8, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1262,9 +1262,9 @@ TEST(SM50_device_plus_multiplies_dsrgemm_tt_t, 
64x64x8_16x16x1_4x2_4x8_4x4) { using WarpShape = cutlass::gemm::GemmShape<16, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1298,9 +1298,9 @@ TEST(SM50_device_plus_multiplies_dsrgemm_tt_t, 128x32x16_32x8x1_4x2_8x4_4x4) { using WarpShape = cutlass::gemm::GemmShape<32, 8, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; diff --git a/test/device/sm50_simt_plus_multiplies_ssrgemm_nn_n.cu b/test/device/sm50_simt_plus_multiplies_ssrgemm_nn_n.cu index e43e284..444fc29 100644 --- a/test/device/sm50_simt_plus_multiplies_ssrgemm_nn_n.cu +++ b/test/device/sm50_simt_plus_multiplies_ssrgemm_nn_n.cu @@ -38,9 +38,9 @@ TEST(SM50_device_plus_multiplies_ssrgemm_nn_n, 8x32x8_8x32x1_2x4_4x8_1x1) { using WarpShape = cutlass::gemm::GemmShape<8, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, 
precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -74,9 +74,9 @@ TEST(SM50_device_plus_multiplies_ssrgemm_nn_n, 16x32x8_16x32x1_4x4_4x8_1x1) { using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -110,9 +110,9 @@ TEST(SM50_device_plus_multiplies_ssrgemm_nn_n, 16x64x8_16x64x1_4x8_4x8_1x1) { using WarpShape = cutlass::gemm::GemmShape<16, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -146,9 +146,9 @@ TEST(SM50_device_plus_multiplies_ssrgemm_nn_n, 32x32x8_32x32x1_8x4_4x8_1x1) { using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using 
AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -182,9 +182,9 @@ TEST(SM50_device_plus_multiplies_ssrgemm_nn_n, 32x64x8_32x64x1_8x8_4x8_1x1) { using WarpShape = cutlass::gemm::GemmShape<32, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -218,9 +218,9 @@ TEST(SM50_device_plus_multiplies_ssrgemm_nn_n, 64x32x8_64x32x1_8x8_8x4_1x1) { using WarpShape = cutlass::gemm::GemmShape<64, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -254,9 +254,9 @@ TEST(SM50_device_plus_multiplies_ssrgemm_nn_n, 8x32x8_8x16x1_2x2_4x8_1x2) { using WarpShape = cutlass::gemm::GemmShape<8, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; 
@@ -290,9 +290,9 @@ TEST(SM50_device_plus_multiplies_ssrgemm_nn_n, 8x64x8_8x32x1_2x4_4x8_1x2) { using WarpShape = cutlass::gemm::GemmShape<8, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -326,9 +326,9 @@ TEST(SM50_device_plus_multiplies_ssrgemm_nn_n, 16x32x8_16x16x1_4x2_4x8_1x2) { using WarpShape = cutlass::gemm::GemmShape<16, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -362,9 +362,9 @@ TEST(SM50_device_plus_multiplies_ssrgemm_nn_n, 16x64x8_16x32x1_4x4_4x8_1x2) { using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -398,9 +398,9 @@ TEST(SM50_device_plus_multiplies_ssrgemm_nn_n, 
16x128x8_16x64x1_4x8_4x8_1x2) { using WarpShape = cutlass::gemm::GemmShape<16, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -434,9 +434,9 @@ TEST(SM50_device_plus_multiplies_ssrgemm_nn_n, 32x32x8_32x16x1_4x4_8x4_1x2) { using WarpShape = cutlass::gemm::GemmShape<32, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -470,9 +470,9 @@ TEST(SM50_device_plus_multiplies_ssrgemm_nn_n, 32x64x8_32x32x1_8x4_4x8_1x2) { using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -506,9 +506,9 @@ TEST(SM50_device_plus_multiplies_ssrgemm_nn_n, 32x128x8_32x64x1_8x8_4x8_1x2) { using WarpShape = 
cutlass::gemm::GemmShape<32, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -542,9 +542,9 @@ TEST(SM50_device_plus_multiplies_ssrgemm_nn_n, 64x64x8_64x32x1_8x8_8x4_1x2) { using WarpShape = cutlass::gemm::GemmShape<64, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -578,9 +578,9 @@ TEST(SM50_device_plus_multiplies_ssrgemm_nn_n, 32x32x8_16x32x1_4x4_4x8_2x1) { using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -614,9 +614,9 @@ TEST(SM50_device_plus_multiplies_ssrgemm_nn_n, 64x32x8_32x32x1_8x4_4x8_2x1) { using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = 
cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -650,9 +650,9 @@ TEST(SM50_device_plus_multiplies_ssrgemm_nn_n, 64x64x8_32x64x1_8x8_4x8_2x1) { using WarpShape = cutlass::gemm::GemmShape<32, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -686,9 +686,9 @@ TEST(SM50_device_plus_multiplies_ssrgemm_nn_n, 128x32x8_64x32x1_8x8_8x4_2x1) { using WarpShape = cutlass::gemm::GemmShape<64, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -722,9 +722,9 @@ TEST(SM50_device_plus_multiplies_ssrgemm_nn_n, 16x32x8_8x16x1_2x2_4x8_2x2) { using WarpShape = cutlass::gemm::GemmShape<8, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename 
cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -758,9 +758,9 @@ TEST(SM50_device_plus_multiplies_ssrgemm_nn_n, 16x64x8_8x32x1_2x4_4x8_2x2) { using WarpShape = cutlass::gemm::GemmShape<8, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -794,9 +794,9 @@ TEST(SM50_device_plus_multiplies_ssrgemm_nn_n, 32x32x8_16x16x1_4x2_4x8_2x2) { using WarpShape = cutlass::gemm::GemmShape<16, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -830,9 +830,9 @@ TEST(SM50_device_plus_multiplies_ssrgemm_nn_n, 32x64x8_16x32x1_4x4_4x8_2x2) { using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, 
precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -866,9 +866,9 @@ TEST(SM50_device_plus_multiplies_ssrgemm_nn_n, 32x128x8_16x64x1_4x8_4x8_2x2) { using WarpShape = cutlass::gemm::GemmShape<16, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -902,9 +902,9 @@ TEST(SM50_device_plus_multiplies_ssrgemm_nn_n, 64x32x8_32x16x1_4x4_8x4_2x2) { using WarpShape = cutlass::gemm::GemmShape<32, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -938,9 +938,9 @@ TEST(SM50_device_plus_multiplies_ssrgemm_nn_n, 64x64x8_32x32x1_8x4_4x8_2x2) { using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, 
cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -974,9 +974,9 @@ TEST(SM50_device_plus_multiplies_ssrgemm_nn_n, 64x128x8_32x64x1_8x8_4x8_2x2) { using WarpShape = cutlass::gemm::GemmShape<32, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1010,9 +1010,9 @@ TEST(SM50_device_plus_multiplies_ssrgemm_nn_n, 128x32x8_64x16x1_8x4_8x4_2x2) { using WarpShape = cutlass::gemm::GemmShape<64, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1046,9 +1046,9 @@ TEST(SM50_device_plus_multiplies_ssrgemm_nn_n, 128x64x8_64x32x1_8x8_8x4_2x2) { using WarpShape = cutlass::gemm::GemmShape<64, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename 
cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1082,9 +1082,9 @@ TEST(SM50_device_plus_multiplies_ssrgemm_nn_n, 16x64x16_8x16x1_2x2_4x8_2x4) { using WarpShape = cutlass::gemm::GemmShape<8, 16, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1118,9 +1118,9 @@ TEST(SM50_device_plus_multiplies_ssrgemm_nn_n, 16x128x16_8x32x1_2x4_4x8_2x4) { using WarpShape = cutlass::gemm::GemmShape<8, 32, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1154,9 +1154,9 @@ TEST(SM50_device_plus_multiplies_ssrgemm_nn_n, 32x32x8_16x8x1_2x2_8x4_2x4) { using WarpShape = cutlass::gemm::GemmShape<16, 8, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + 
precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1190,9 +1190,9 @@ TEST(SM50_device_plus_multiplies_ssrgemm_nn_n, 32x64x8_16x16x1_4x2_4x8_2x4) { using WarpShape = cutlass::gemm::GemmShape<16, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1226,9 +1226,9 @@ TEST(SM50_device_plus_multiplies_ssrgemm_nn_n, 32x128x8_16x32x1_4x4_4x8_2x4) { using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1262,9 +1262,9 @@ TEST(SM50_device_plus_multiplies_ssrgemm_nn_n, 32x256x8_16x64x1_4x8_4x8_2x4) { using WarpShape = cutlass::gemm::GemmShape<16, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, 
cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1298,9 +1298,9 @@ TEST(SM50_device_plus_multiplies_ssrgemm_nn_n, 64x64x8_32x16x1_4x4_8x4_2x4) { using WarpShape = cutlass::gemm::GemmShape<32, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1334,9 +1334,9 @@ TEST(SM50_device_plus_multiplies_ssrgemm_nn_n, 64x128x8_32x32x1_8x4_4x8_2x4) { using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1370,9 +1370,9 @@ TEST(SM50_device_plus_multiplies_ssrgemm_nn_n, 64x256x8_32x64x1_8x8_4x8_2x4) { using WarpShape = cutlass::gemm::GemmShape<32, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = 
Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1406,9 +1406,9 @@ TEST(SM50_device_plus_multiplies_ssrgemm_nn_n, 128x128x8_64x32x1_8x8_8x4_2x4) { using WarpShape = cutlass::gemm::GemmShape<64, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1442,9 +1442,9 @@ TEST(SM50_device_plus_multiplies_ssrgemm_nn_n, 32x32x8_8x16x1_2x2_4x8_4x2) { using WarpShape = cutlass::gemm::GemmShape<8, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1478,9 +1478,9 @@ TEST(SM50_device_plus_multiplies_ssrgemm_nn_n, 64x32x8_16x16x1_4x2_4x8_4x2) { using WarpShape = cutlass::gemm::GemmShape<16, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; 
@@ -1514,9 +1514,9 @@ TEST(SM50_device_plus_multiplies_ssrgemm_nn_n, 64x64x8_16x32x1_4x4_4x8_4x2) { using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1550,9 +1550,9 @@ TEST(SM50_device_plus_multiplies_ssrgemm_nn_n, 128x32x8_32x16x1_4x4_8x4_4x2) { using WarpShape = cutlass::gemm::GemmShape<32, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1586,9 +1586,9 @@ TEST(SM50_device_plus_multiplies_ssrgemm_nn_n, 128x64x8_32x32x1_8x4_4x8_4x2) { using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1622,9 +1622,9 @@ 
TEST(SM50_device_plus_multiplies_ssrgemm_nn_n, 128x128x8_32x64x1_8x8_4x8_4x2) { using WarpShape = cutlass::gemm::GemmShape<32, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1658,9 +1658,9 @@ TEST(SM50_device_plus_multiplies_ssrgemm_nn_n, 256x32x8_64x16x1_8x4_8x4_4x2) { using WarpShape = cutlass::gemm::GemmShape<64, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1694,9 +1694,9 @@ TEST(SM50_device_plus_multiplies_ssrgemm_nn_n, 256x64x8_64x32x1_8x8_8x4_4x2) { using WarpShape = cutlass::gemm::GemmShape<64, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1730,9 +1730,9 @@ TEST(SM50_device_plus_multiplies_ssrgemm_nn_n, 
32x64x16_8x16x1_2x2_4x8_4x4) { using WarpShape = cutlass::gemm::GemmShape<8, 16, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1766,9 +1766,9 @@ TEST(SM50_device_plus_multiplies_ssrgemm_nn_n, 32x128x16_8x32x1_2x4_4x8_4x4) { using WarpShape = cutlass::gemm::GemmShape<8, 32, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1802,9 +1802,9 @@ TEST(SM50_device_plus_multiplies_ssrgemm_nn_n, 64x32x16_16x8x1_2x2_8x4_4x4) { using WarpShape = cutlass::gemm::GemmShape<16, 8, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1838,9 +1838,9 @@ TEST(SM50_device_plus_multiplies_ssrgemm_nn_n, 64x64x8_16x16x1_4x2_4x8_4x4) { using WarpShape = 
cutlass::gemm::GemmShape<16, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1874,9 +1874,9 @@ TEST(SM50_device_plus_multiplies_ssrgemm_nn_n, 64x128x8_16x32x1_4x4_4x8_4x4) { using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1910,9 +1910,9 @@ TEST(SM50_device_plus_multiplies_ssrgemm_nn_n, 64x256x8_16x64x1_4x8_4x8_4x4) { using WarpShape = cutlass::gemm::GemmShape<16, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1946,9 +1946,9 @@ TEST(SM50_device_plus_multiplies_ssrgemm_nn_n, 128x32x16_32x8x1_4x2_8x4_4x4) { using WarpShape = cutlass::gemm::GemmShape<32, 8, 16>; using 
InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1982,9 +1982,9 @@ TEST(SM50_device_plus_multiplies_ssrgemm_nn_n, 128x64x8_32x16x1_4x4_8x4_4x4) { using WarpShape = cutlass::gemm::GemmShape<32, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -2018,9 +2018,9 @@ TEST(SM50_device_plus_multiplies_ssrgemm_nn_n, 128x128x8_32x32x1_8x4_4x8_4x4) { using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -2054,9 +2054,9 @@ TEST(SM50_device_plus_multiplies_ssrgemm_nn_n, 256x64x8_64x16x1_8x4_8x4_4x4) { using WarpShape = cutlass::gemm::GemmShape<64, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - 
using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; diff --git a/test/device/sm50_simt_plus_multiplies_ssrgemm_nn_t.cu b/test/device/sm50_simt_plus_multiplies_ssrgemm_nn_t.cu index f3718d6..de9f613 100644 --- a/test/device/sm50_simt_plus_multiplies_ssrgemm_nn_t.cu +++ b/test/device/sm50_simt_plus_multiplies_ssrgemm_nn_t.cu @@ -38,9 +38,9 @@ TEST(SM50_device_plus_multiplies_ssrgemm_nn_t, 8x32x8_8x32x1_2x4_4x8_1x1) { using WarpShape = cutlass::gemm::GemmShape<8, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -74,9 +74,9 @@ TEST(SM50_device_plus_multiplies_ssrgemm_nn_t, 16x32x8_16x32x1_4x4_4x8_1x1) { using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -110,9 +110,9 
@@ TEST(SM50_device_plus_multiplies_ssrgemm_nn_t, 16x64x8_16x64x1_4x8_4x8_1x1) { using WarpShape = cutlass::gemm::GemmShape<16, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -146,9 +146,9 @@ TEST(SM50_device_plus_multiplies_ssrgemm_nn_t, 32x32x8_32x32x1_8x4_4x8_1x1) { using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -182,9 +182,9 @@ TEST(SM50_device_plus_multiplies_ssrgemm_nn_t, 32x64x8_32x64x1_8x8_4x8_1x1) { using WarpShape = cutlass::gemm::GemmShape<32, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -218,9 +218,9 @@ TEST(SM50_device_plus_multiplies_ssrgemm_nn_t, 
64x32x8_64x32x1_8x8_8x4_1x1) { using WarpShape = cutlass::gemm::GemmShape<64, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -254,9 +254,9 @@ TEST(SM50_device_plus_multiplies_ssrgemm_nn_t, 8x32x8_8x16x1_2x2_4x8_1x2) { using WarpShape = cutlass::gemm::GemmShape<8, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -290,9 +290,9 @@ TEST(SM50_device_plus_multiplies_ssrgemm_nn_t, 8x64x8_8x32x1_2x4_4x8_1x2) { using WarpShape = cutlass::gemm::GemmShape<8, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -326,9 +326,9 @@ TEST(SM50_device_plus_multiplies_ssrgemm_nn_t, 16x32x8_16x16x1_4x2_4x8_1x2) { using WarpShape = 
cutlass::gemm::GemmShape<16, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -362,9 +362,9 @@ TEST(SM50_device_plus_multiplies_ssrgemm_nn_t, 16x64x8_16x32x1_4x4_4x8_1x2) { using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -398,9 +398,9 @@ TEST(SM50_device_plus_multiplies_ssrgemm_nn_t, 16x128x8_16x64x1_4x8_4x8_1x2) { using WarpShape = cutlass::gemm::GemmShape<16, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -434,9 +434,9 @@ TEST(SM50_device_plus_multiplies_ssrgemm_nn_t, 32x32x8_32x16x1_4x4_8x4_1x2) { using WarpShape = cutlass::gemm::GemmShape<32, 16, 8>; using InstructionShape = 
cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -470,9 +470,9 @@ TEST(SM50_device_plus_multiplies_ssrgemm_nn_t, 32x64x8_32x32x1_8x4_4x8_1x2) { using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -506,9 +506,9 @@ TEST(SM50_device_plus_multiplies_ssrgemm_nn_t, 32x128x8_32x64x1_8x8_4x8_1x2) { using WarpShape = cutlass::gemm::GemmShape<32, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -542,9 +542,9 @@ TEST(SM50_device_plus_multiplies_ssrgemm_nn_t, 64x64x8_64x32x1_8x8_8x4_1x2) { using WarpShape = cutlass::gemm::GemmShape<64, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename 
cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -578,9 +578,9 @@ TEST(SM50_device_plus_multiplies_ssrgemm_nn_t, 32x32x8_16x32x1_4x4_4x8_2x1) { using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -614,9 +614,9 @@ TEST(SM50_device_plus_multiplies_ssrgemm_nn_t, 64x32x8_32x32x1_8x4_4x8_2x1) { using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -650,9 +650,9 @@ TEST(SM50_device_plus_multiplies_ssrgemm_nn_t, 64x64x8_32x64x1_8x8_4x8_2x1) { using WarpShape = cutlass::gemm::GemmShape<32, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, 
precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -686,9 +686,9 @@ TEST(SM50_device_plus_multiplies_ssrgemm_nn_t, 128x32x8_64x32x1_8x8_8x4_2x1) { using WarpShape = cutlass::gemm::GemmShape<64, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -722,9 +722,9 @@ TEST(SM50_device_plus_multiplies_ssrgemm_nn_t, 16x32x8_8x16x1_2x2_4x8_2x2) { using WarpShape = cutlass::gemm::GemmShape<8, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -758,9 +758,9 @@ TEST(SM50_device_plus_multiplies_ssrgemm_nn_t, 16x64x8_8x32x1_2x4_4x8_2x2) { using WarpShape = cutlass::gemm::GemmShape<8, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, 
cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -794,9 +794,9 @@ TEST(SM50_device_plus_multiplies_ssrgemm_nn_t, 32x32x8_16x16x1_4x2_4x8_2x2) { using WarpShape = cutlass::gemm::GemmShape<16, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -830,9 +830,9 @@ TEST(SM50_device_plus_multiplies_ssrgemm_nn_t, 32x64x8_16x32x1_4x4_4x8_2x2) { using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -866,9 +866,9 @@ TEST(SM50_device_plus_multiplies_ssrgemm_nn_t, 32x128x8_16x64x1_4x8_4x8_2x2) { using WarpShape = cutlass::gemm::GemmShape<16, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename 
cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -902,9 +902,9 @@ TEST(SM50_device_plus_multiplies_ssrgemm_nn_t, 64x32x8_32x16x1_4x4_8x4_2x2) { using WarpShape = cutlass::gemm::GemmShape<32, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -938,9 +938,9 @@ TEST(SM50_device_plus_multiplies_ssrgemm_nn_t, 64x64x8_32x32x1_8x4_4x8_2x2) { using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -974,9 +974,9 @@ TEST(SM50_device_plus_multiplies_ssrgemm_nn_t, 64x128x8_32x64x1_8x8_4x8_2x2) { using WarpShape = cutlass::gemm::GemmShape<32, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, 
precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1010,9 +1010,9 @@ TEST(SM50_device_plus_multiplies_ssrgemm_nn_t, 128x32x8_64x16x1_8x4_8x4_2x2) { using WarpShape = cutlass::gemm::GemmShape<64, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1046,9 +1046,9 @@ TEST(SM50_device_plus_multiplies_ssrgemm_nn_t, 128x64x8_64x32x1_8x8_8x4_2x2) { using WarpShape = cutlass::gemm::GemmShape<64, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1082,9 +1082,9 @@ TEST(SM50_device_plus_multiplies_ssrgemm_nn_t, 16x64x16_8x16x1_2x2_4x8_2x4) { using WarpShape = cutlass::gemm::GemmShape<8, 16, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, 
cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1118,9 +1118,9 @@ TEST(SM50_device_plus_multiplies_ssrgemm_nn_t, 16x128x16_8x32x1_2x4_4x8_2x4) { using WarpShape = cutlass::gemm::GemmShape<8, 32, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1154,9 +1154,9 @@ TEST(SM50_device_plus_multiplies_ssrgemm_nn_t, 32x32x8_16x8x1_2x2_8x4_2x4) { using WarpShape = cutlass::gemm::GemmShape<16, 8, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1190,9 +1190,9 @@ TEST(SM50_device_plus_multiplies_ssrgemm_nn_t, 32x64x8_16x16x1_4x2_4x8_2x4) { using WarpShape = cutlass::gemm::GemmShape<16, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = 
Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1226,9 +1226,9 @@ TEST(SM50_device_plus_multiplies_ssrgemm_nn_t, 32x128x8_16x32x1_4x4_4x8_2x4) { using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1262,9 +1262,9 @@ TEST(SM50_device_plus_multiplies_ssrgemm_nn_t, 32x256x8_16x64x1_4x8_4x8_2x4) { using WarpShape = cutlass::gemm::GemmShape<16, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1298,9 +1298,9 @@ TEST(SM50_device_plus_multiplies_ssrgemm_nn_t, 64x64x8_32x16x1_4x4_8x4_2x4) { using WarpShape = cutlass::gemm::GemmShape<32, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = 
Config::MultiplicationOp; @@ -1334,9 +1334,9 @@ TEST(SM50_device_plus_multiplies_ssrgemm_nn_t, 64x128x8_32x32x1_8x4_4x8_2x4) { using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1370,9 +1370,9 @@ TEST(SM50_device_plus_multiplies_ssrgemm_nn_t, 64x256x8_32x64x1_8x8_4x8_2x4) { using WarpShape = cutlass::gemm::GemmShape<32, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1406,9 +1406,9 @@ TEST(SM50_device_plus_multiplies_ssrgemm_nn_t, 128x128x8_64x32x1_8x8_8x4_2x4) { using WarpShape = cutlass::gemm::GemmShape<64, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1442,9 +1442,9 @@ 
TEST(SM50_device_plus_multiplies_ssrgemm_nn_t, 32x32x8_8x16x1_2x2_4x8_4x2) { using WarpShape = cutlass::gemm::GemmShape<8, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1478,9 +1478,9 @@ TEST(SM50_device_plus_multiplies_ssrgemm_nn_t, 64x32x8_16x16x1_4x2_4x8_4x2) { using WarpShape = cutlass::gemm::GemmShape<16, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1514,9 +1514,9 @@ TEST(SM50_device_plus_multiplies_ssrgemm_nn_t, 64x64x8_16x32x1_4x4_4x8_4x2) { using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1550,9 +1550,9 @@ TEST(SM50_device_plus_multiplies_ssrgemm_nn_t, 
128x32x8_32x16x1_4x4_8x4_4x2) { using WarpShape = cutlass::gemm::GemmShape<32, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1586,9 +1586,9 @@ TEST(SM50_device_plus_multiplies_ssrgemm_nn_t, 128x64x8_32x32x1_8x4_4x8_4x2) { using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1622,9 +1622,9 @@ TEST(SM50_device_plus_multiplies_ssrgemm_nn_t, 128x128x8_32x64x1_8x8_4x8_4x2) { using WarpShape = cutlass::gemm::GemmShape<32, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1658,9 +1658,9 @@ TEST(SM50_device_plus_multiplies_ssrgemm_nn_t, 256x32x8_64x16x1_8x4_8x4_4x2) { using WarpShape = 
cutlass::gemm::GemmShape<64, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1694,9 +1694,9 @@ TEST(SM50_device_plus_multiplies_ssrgemm_nn_t, 256x64x8_64x32x1_8x8_8x4_4x2) { using WarpShape = cutlass::gemm::GemmShape<64, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1730,9 +1730,9 @@ TEST(SM50_device_plus_multiplies_ssrgemm_nn_t, 32x64x16_8x16x1_2x2_4x8_4x4) { using WarpShape = cutlass::gemm::GemmShape<8, 16, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1766,9 +1766,9 @@ TEST(SM50_device_plus_multiplies_ssrgemm_nn_t, 32x128x16_8x32x1_2x4_4x8_4x4) { using WarpShape = cutlass::gemm::GemmShape<8, 32, 16>; using InstructionShape 
= cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1802,9 +1802,9 @@ TEST(SM50_device_plus_multiplies_ssrgemm_nn_t, 64x32x16_16x8x1_2x2_8x4_4x4) { using WarpShape = cutlass::gemm::GemmShape<16, 8, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1838,9 +1838,9 @@ TEST(SM50_device_plus_multiplies_ssrgemm_nn_t, 64x64x8_16x16x1_4x2_4x8_4x4) { using WarpShape = cutlass::gemm::GemmShape<16, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1874,9 +1874,9 @@ TEST(SM50_device_plus_multiplies_ssrgemm_nn_t, 64x128x8_16x32x1_4x4_4x8_4x4) { using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = 
typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1910,9 +1910,9 @@ TEST(SM50_device_plus_multiplies_ssrgemm_nn_t, 64x256x8_16x64x1_4x8_4x8_4x4) { using WarpShape = cutlass::gemm::GemmShape<16, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1946,9 +1946,9 @@ TEST(SM50_device_plus_multiplies_ssrgemm_nn_t, 128x32x16_32x8x1_4x2_8x4_4x4) { using WarpShape = cutlass::gemm::GemmShape<32, 8, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1982,9 +1982,9 @@ TEST(SM50_device_plus_multiplies_ssrgemm_nn_t, 128x64x8_32x16x1_4x4_8x4_4x4) { using WarpShape = cutlass::gemm::GemmShape<32, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename 
cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -2018,9 +2018,9 @@ TEST(SM50_device_plus_multiplies_ssrgemm_nn_t, 128x128x8_32x32x1_8x4_4x8_4x4) { using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -2054,9 +2054,9 @@ TEST(SM50_device_plus_multiplies_ssrgemm_nn_t, 256x64x8_64x16x1_8x4_8x4_4x4) { using WarpShape = cutlass::gemm::GemmShape<64, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; diff --git a/test/device/sm50_simt_plus_multiplies_ssrgemm_nt_n.cu b/test/device/sm50_simt_plus_multiplies_ssrgemm_nt_n.cu index 3c59a75..d851e4e 100644 --- a/test/device/sm50_simt_plus_multiplies_ssrgemm_nt_n.cu +++ b/test/device/sm50_simt_plus_multiplies_ssrgemm_nt_n.cu @@ -38,9 +38,9 @@ 
TEST(SM50_device_plus_multiplies_ssrgemm_nt_n, 8x32x8_8x32x1_2x4_4x8_1x1) { using WarpShape = cutlass::gemm::GemmShape<8, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -74,9 +74,9 @@ TEST(SM50_device_plus_multiplies_ssrgemm_nt_n, 16x32x8_16x32x1_4x4_4x8_1x1) { using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -110,9 +110,9 @@ TEST(SM50_device_plus_multiplies_ssrgemm_nt_n, 16x64x8_16x64x1_4x8_4x8_1x1) { using WarpShape = cutlass::gemm::GemmShape<16, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -146,9 +146,9 @@ TEST(SM50_device_plus_multiplies_ssrgemm_nt_n, 
32x32x8_32x32x1_8x4_4x8_1x1) { using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -182,9 +182,9 @@ TEST(SM50_device_plus_multiplies_ssrgemm_nt_n, 32x64x8_32x64x1_8x8_4x8_1x1) { using WarpShape = cutlass::gemm::GemmShape<32, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -218,9 +218,9 @@ TEST(SM50_device_plus_multiplies_ssrgemm_nt_n, 64x32x8_64x32x1_8x8_8x4_1x1) { using WarpShape = cutlass::gemm::GemmShape<64, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -254,9 +254,9 @@ TEST(SM50_device_plus_multiplies_ssrgemm_nt_n, 8x32x8_8x16x1_2x2_4x8_1x2) { using WarpShape = 
cutlass::gemm::GemmShape<8, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -290,9 +290,9 @@ TEST(SM50_device_plus_multiplies_ssrgemm_nt_n, 8x64x8_8x32x1_2x4_4x8_1x2) { using WarpShape = cutlass::gemm::GemmShape<8, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -326,9 +326,9 @@ TEST(SM50_device_plus_multiplies_ssrgemm_nt_n, 16x32x8_16x16x1_4x2_4x8_1x2) { using WarpShape = cutlass::gemm::GemmShape<16, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -362,9 +362,9 @@ TEST(SM50_device_plus_multiplies_ssrgemm_nt_n, 16x64x8_16x32x1_4x4_4x8_1x2) { using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = 
cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -398,9 +398,9 @@ TEST(SM50_device_plus_multiplies_ssrgemm_nt_n, 16x128x8_16x64x1_4x8_4x8_1x2) { using WarpShape = cutlass::gemm::GemmShape<16, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -434,9 +434,9 @@ TEST(SM50_device_plus_multiplies_ssrgemm_nt_n, 32x32x8_32x16x1_4x4_8x4_1x2) { using WarpShape = cutlass::gemm::GemmShape<32, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -470,9 +470,9 @@ TEST(SM50_device_plus_multiplies_ssrgemm_nt_n, 32x64x8_32x32x1_8x4_4x8_1x2) { using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename 
cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -506,9 +506,9 @@ TEST(SM50_device_plus_multiplies_ssrgemm_nt_n, 32x128x8_32x64x1_8x8_4x8_1x2) { using WarpShape = cutlass::gemm::GemmShape<32, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -542,9 +542,9 @@ TEST(SM50_device_plus_multiplies_ssrgemm_nt_n, 64x64x8_64x32x1_8x8_8x4_1x2) { using WarpShape = cutlass::gemm::GemmShape<64, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -578,9 +578,9 @@ TEST(SM50_device_plus_multiplies_ssrgemm_nt_n, 32x32x8_16x32x1_4x4_4x8_2x1) { using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, 
precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -614,9 +614,9 @@ TEST(SM50_device_plus_multiplies_ssrgemm_nt_n, 64x32x8_32x32x1_8x4_4x8_2x1) { using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -650,9 +650,9 @@ TEST(SM50_device_plus_multiplies_ssrgemm_nt_n, 64x64x8_32x64x1_8x8_4x8_2x1) { using WarpShape = cutlass::gemm::GemmShape<32, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -686,9 +686,9 @@ TEST(SM50_device_plus_multiplies_ssrgemm_nt_n, 128x32x8_64x32x1_8x8_8x4_2x1) { using WarpShape = cutlass::gemm::GemmShape<64, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, 
cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -722,9 +722,9 @@ TEST(SM50_device_plus_multiplies_ssrgemm_nt_n, 16x32x8_8x16x1_2x2_4x8_2x2) { using WarpShape = cutlass::gemm::GemmShape<8, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -758,9 +758,9 @@ TEST(SM50_device_plus_multiplies_ssrgemm_nt_n, 16x64x8_8x32x1_2x4_4x8_2x2) { using WarpShape = cutlass::gemm::GemmShape<8, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -794,9 +794,9 @@ TEST(SM50_device_plus_multiplies_ssrgemm_nt_n, 32x32x8_16x16x1_4x2_4x8_2x2) { using WarpShape = cutlass::gemm::GemmShape<16, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename 
cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -830,9 +830,9 @@ TEST(SM50_device_plus_multiplies_ssrgemm_nt_n, 32x64x8_16x32x1_4x4_4x8_2x2) { using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -866,9 +866,9 @@ TEST(SM50_device_plus_multiplies_ssrgemm_nt_n, 32x128x8_16x64x1_4x8_4x8_2x2) { using WarpShape = cutlass::gemm::GemmShape<16, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -902,9 +902,9 @@ TEST(SM50_device_plus_multiplies_ssrgemm_nt_n, 64x32x8_32x16x1_4x4_8x4_2x2) { using WarpShape = cutlass::gemm::GemmShape<32, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, 
precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -938,9 +938,9 @@ TEST(SM50_device_plus_multiplies_ssrgemm_nt_n, 64x64x8_32x32x1_8x4_4x8_2x2) { using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -974,9 +974,9 @@ TEST(SM50_device_plus_multiplies_ssrgemm_nt_n, 64x128x8_32x64x1_8x8_4x8_2x2) { using WarpShape = cutlass::gemm::GemmShape<32, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1010,9 +1010,9 @@ TEST(SM50_device_plus_multiplies_ssrgemm_nt_n, 128x32x8_64x16x1_8x4_8x4_2x2) { using WarpShape = cutlass::gemm::GemmShape<64, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, 
cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1046,9 +1046,9 @@ TEST(SM50_device_plus_multiplies_ssrgemm_nt_n, 128x64x8_64x32x1_8x8_8x4_2x2) { using WarpShape = cutlass::gemm::GemmShape<64, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1082,9 +1082,9 @@ TEST(SM50_device_plus_multiplies_ssrgemm_nt_n, 16x64x16_8x16x1_2x2_4x8_2x4) { using WarpShape = cutlass::gemm::GemmShape<8, 16, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1118,9 +1118,9 @@ TEST(SM50_device_plus_multiplies_ssrgemm_nt_n, 16x128x16_8x32x1_2x4_4x8_2x4) { using WarpShape = cutlass::gemm::GemmShape<8, 32, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = 
Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1154,9 +1154,9 @@ TEST(SM50_device_plus_multiplies_ssrgemm_nt_n, 32x32x8_16x8x1_2x2_8x4_2x4) { using WarpShape = cutlass::gemm::GemmShape<16, 8, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1190,9 +1190,9 @@ TEST(SM50_device_plus_multiplies_ssrgemm_nt_n, 32x64x8_16x16x1_4x2_4x8_2x4) { using WarpShape = cutlass::gemm::GemmShape<16, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1226,9 +1226,9 @@ TEST(SM50_device_plus_multiplies_ssrgemm_nt_n, 32x128x8_16x32x1_4x4_4x8_2x4) { using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; 
@@ -1262,9 +1262,9 @@ TEST(SM50_device_plus_multiplies_ssrgemm_nt_n, 32x256x8_16x64x1_4x8_4x8_2x4) { using WarpShape = cutlass::gemm::GemmShape<16, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1298,9 +1298,9 @@ TEST(SM50_device_plus_multiplies_ssrgemm_nt_n, 64x64x8_32x16x1_4x4_8x4_2x4) { using WarpShape = cutlass::gemm::GemmShape<32, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1334,9 +1334,9 @@ TEST(SM50_device_plus_multiplies_ssrgemm_nt_n, 64x128x8_32x32x1_8x4_4x8_2x4) { using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1370,9 +1370,9 @@ 
TEST(SM50_device_plus_multiplies_ssrgemm_nt_n, 64x256x8_32x64x1_8x8_4x8_2x4) { using WarpShape = cutlass::gemm::GemmShape<32, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1406,9 +1406,9 @@ TEST(SM50_device_plus_multiplies_ssrgemm_nt_n, 128x128x8_64x32x1_8x8_8x4_2x4) { using WarpShape = cutlass::gemm::GemmShape<64, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1442,9 +1442,9 @@ TEST(SM50_device_plus_multiplies_ssrgemm_nt_n, 32x32x8_8x16x1_2x2_4x8_4x2) { using WarpShape = cutlass::gemm::GemmShape<8, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1478,9 +1478,9 @@ TEST(SM50_device_plus_multiplies_ssrgemm_nt_n, 
64x32x8_16x16x1_4x2_4x8_4x2) { using WarpShape = cutlass::gemm::GemmShape<16, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1514,9 +1514,9 @@ TEST(SM50_device_plus_multiplies_ssrgemm_nt_n, 64x64x8_16x32x1_4x4_4x8_4x2) { using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1550,9 +1550,9 @@ TEST(SM50_device_plus_multiplies_ssrgemm_nt_n, 128x32x8_32x16x1_4x4_8x4_4x2) { using WarpShape = cutlass::gemm::GemmShape<32, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1586,9 +1586,9 @@ TEST(SM50_device_plus_multiplies_ssrgemm_nt_n, 128x64x8_32x32x1_8x4_4x8_4x2) { using WarpShape = 
cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1622,9 +1622,9 @@ TEST(SM50_device_plus_multiplies_ssrgemm_nt_n, 128x128x8_32x64x1_8x8_4x8_4x2) { using WarpShape = cutlass::gemm::GemmShape<32, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1658,9 +1658,9 @@ TEST(SM50_device_plus_multiplies_ssrgemm_nt_n, 256x32x8_64x16x1_8x4_8x4_4x2) { using WarpShape = cutlass::gemm::GemmShape<64, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1694,9 +1694,9 @@ TEST(SM50_device_plus_multiplies_ssrgemm_nt_n, 256x64x8_64x32x1_8x8_8x4_4x2) { using WarpShape = cutlass::gemm::GemmShape<64, 32, 8>; using 
InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1730,9 +1730,9 @@ TEST(SM50_device_plus_multiplies_ssrgemm_nt_n, 32x64x16_8x16x1_2x2_4x8_4x4) { using WarpShape = cutlass::gemm::GemmShape<8, 16, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1766,9 +1766,9 @@ TEST(SM50_device_plus_multiplies_ssrgemm_nt_n, 32x128x16_8x32x1_2x4_4x8_4x4) { using WarpShape = cutlass::gemm::GemmShape<8, 32, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1802,9 +1802,9 @@ TEST(SM50_device_plus_multiplies_ssrgemm_nt_n, 64x32x16_16x8x1_2x2_8x4_4x4) { using WarpShape = cutlass::gemm::GemmShape<16, 8, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - 
using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1838,9 +1838,9 @@ TEST(SM50_device_plus_multiplies_ssrgemm_nt_n, 64x64x8_16x16x1_4x2_4x8_4x4) { using WarpShape = cutlass::gemm::GemmShape<16, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1874,9 +1874,9 @@ TEST(SM50_device_plus_multiplies_ssrgemm_nt_n, 64x128x8_16x32x1_4x4_4x8_4x4) { using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1910,9 +1910,9 @@ TEST(SM50_device_plus_multiplies_ssrgemm_nt_n, 64x256x8_16x64x1_4x8_4x8_4x4) { using WarpShape = cutlass::gemm::GemmShape<16, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename 
cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1946,9 +1946,9 @@ TEST(SM50_device_plus_multiplies_ssrgemm_nt_n, 128x32x16_32x8x1_4x2_8x4_4x4) { using WarpShape = cutlass::gemm::GemmShape<32, 8, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1982,9 +1982,9 @@ TEST(SM50_device_plus_multiplies_ssrgemm_nt_n, 128x64x8_32x16x1_4x4_8x4_4x4) { using WarpShape = cutlass::gemm::GemmShape<32, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -2018,9 +2018,9 @@ TEST(SM50_device_plus_multiplies_ssrgemm_nt_n, 128x128x8_32x32x1_8x4_4x8_4x4) { using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - 
precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -2054,9 +2054,9 @@ TEST(SM50_device_plus_multiplies_ssrgemm_nt_n, 256x64x8_64x16x1_8x4_8x4_4x4) { using WarpShape = cutlass::gemm::GemmShape<64, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; diff --git a/test/device/sm50_simt_plus_multiplies_ssrgemm_nt_t.cu b/test/device/sm50_simt_plus_multiplies_ssrgemm_nt_t.cu index 266d2fd..4b64454 100644 --- a/test/device/sm50_simt_plus_multiplies_ssrgemm_nt_t.cu +++ b/test/device/sm50_simt_plus_multiplies_ssrgemm_nt_t.cu @@ -38,9 +38,9 @@ TEST(SM50_device_plus_multiplies_ssrgemm_nt_t, 8x32x8_8x32x1_2x4_4x8_1x1) { using WarpShape = cutlass::gemm::GemmShape<8, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -74,9 +74,9 @@ TEST(SM50_device_plus_multiplies_ssrgemm_nt_t, 
16x32x8_16x32x1_4x4_4x8_1x1) { using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -110,9 +110,9 @@ TEST(SM50_device_plus_multiplies_ssrgemm_nt_t, 16x64x8_16x64x1_4x8_4x8_1x1) { using WarpShape = cutlass::gemm::GemmShape<16, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -146,9 +146,9 @@ TEST(SM50_device_plus_multiplies_ssrgemm_nt_t, 32x32x8_32x32x1_8x4_4x8_1x1) { using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -182,9 +182,9 @@ TEST(SM50_device_plus_multiplies_ssrgemm_nt_t, 32x64x8_32x64x1_8x8_4x8_1x1) { using WarpShape = 
cutlass::gemm::GemmShape<32, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -218,9 +218,9 @@ TEST(SM50_device_plus_multiplies_ssrgemm_nt_t, 64x32x8_64x32x1_8x8_8x4_1x1) { using WarpShape = cutlass::gemm::GemmShape<64, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -254,9 +254,9 @@ TEST(SM50_device_plus_multiplies_ssrgemm_nt_t, 8x32x8_8x16x1_2x2_4x8_1x2) { using WarpShape = cutlass::gemm::GemmShape<8, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -290,9 +290,9 @@ TEST(SM50_device_plus_multiplies_ssrgemm_nt_t, 8x64x8_8x32x1_2x4_4x8_1x2) { using WarpShape = cutlass::gemm::GemmShape<8, 32, 8>; using InstructionShape = 
cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -326,9 +326,9 @@ TEST(SM50_device_plus_multiplies_ssrgemm_nt_t, 16x32x8_16x16x1_4x2_4x8_1x2) { using WarpShape = cutlass::gemm::GemmShape<16, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -362,9 +362,9 @@ TEST(SM50_device_plus_multiplies_ssrgemm_nt_t, 16x64x8_16x32x1_4x4_4x8_1x2) { using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -398,9 +398,9 @@ TEST(SM50_device_plus_multiplies_ssrgemm_nt_t, 16x128x8_16x64x1_4x8_4x8_1x2) { using WarpShape = cutlass::gemm::GemmShape<16, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename 
cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -434,9 +434,9 @@ TEST(SM50_device_plus_multiplies_ssrgemm_nt_t, 32x32x8_32x16x1_4x4_8x4_1x2) { using WarpShape = cutlass::gemm::GemmShape<32, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -470,9 +470,9 @@ TEST(SM50_device_plus_multiplies_ssrgemm_nt_t, 32x64x8_32x32x1_8x4_4x8_1x2) { using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -506,9 +506,9 @@ TEST(SM50_device_plus_multiplies_ssrgemm_nt_t, 32x128x8_32x64x1_8x8_4x8_1x2) { using WarpShape = cutlass::gemm::GemmShape<32, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, 
precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -542,9 +542,9 @@ TEST(SM50_device_plus_multiplies_ssrgemm_nt_t, 64x64x8_64x32x1_8x8_8x4_1x2) { using WarpShape = cutlass::gemm::GemmShape<64, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -578,9 +578,9 @@ TEST(SM50_device_plus_multiplies_ssrgemm_nt_t, 32x32x8_16x32x1_4x4_4x8_2x1) { using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -614,9 +614,9 @@ TEST(SM50_device_plus_multiplies_ssrgemm_nt_t, 64x32x8_32x32x1_8x4_4x8_2x1) { using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, 
cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -650,9 +650,9 @@ TEST(SM50_device_plus_multiplies_ssrgemm_nt_t, 64x64x8_32x64x1_8x8_4x8_2x1) { using WarpShape = cutlass::gemm::GemmShape<32, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -686,9 +686,9 @@ TEST(SM50_device_plus_multiplies_ssrgemm_nt_t, 128x32x8_64x32x1_8x8_8x4_2x1) { using WarpShape = cutlass::gemm::GemmShape<64, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -722,9 +722,9 @@ TEST(SM50_device_plus_multiplies_ssrgemm_nt_t, 16x32x8_8x16x1_2x2_4x8_2x2) { using WarpShape = cutlass::gemm::GemmShape<8, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename 
cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -758,9 +758,9 @@ TEST(SM50_device_plus_multiplies_ssrgemm_nt_t, 16x64x8_8x32x1_2x4_4x8_2x2) { using WarpShape = cutlass::gemm::GemmShape<8, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -794,9 +794,9 @@ TEST(SM50_device_plus_multiplies_ssrgemm_nt_t, 32x32x8_16x16x1_4x2_4x8_2x2) { using WarpShape = cutlass::gemm::GemmShape<16, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -830,9 +830,9 @@ TEST(SM50_device_plus_multiplies_ssrgemm_nt_t, 32x64x8_16x32x1_4x4_4x8_2x2) { using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, 
precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -866,9 +866,9 @@ TEST(SM50_device_plus_multiplies_ssrgemm_nt_t, 32x128x8_16x64x1_4x8_4x8_2x2) { using WarpShape = cutlass::gemm::GemmShape<16, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -902,9 +902,9 @@ TEST(SM50_device_plus_multiplies_ssrgemm_nt_t, 64x32x8_32x16x1_4x4_8x4_2x2) { using WarpShape = cutlass::gemm::GemmShape<32, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -938,9 +938,9 @@ TEST(SM50_device_plus_multiplies_ssrgemm_nt_t, 64x64x8_32x32x1_8x4_4x8_2x2) { using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, 
OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -974,9 +974,9 @@ TEST(SM50_device_plus_multiplies_ssrgemm_nt_t, 64x128x8_32x64x1_8x8_4x8_2x2) { using WarpShape = cutlass::gemm::GemmShape<32, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1010,9 +1010,9 @@ TEST(SM50_device_plus_multiplies_ssrgemm_nt_t, 128x32x8_64x16x1_8x4_8x4_2x2) { using WarpShape = cutlass::gemm::GemmShape<64, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1046,9 +1046,9 @@ TEST(SM50_device_plus_multiplies_ssrgemm_nt_t, 128x64x8_64x32x1_8x8_8x4_2x2) { using WarpShape = cutlass::gemm::GemmShape<64, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using 
MultOp = Config::MultiplicationOp; @@ -1082,9 +1082,9 @@ TEST(SM50_device_plus_multiplies_ssrgemm_nt_t, 16x64x16_8x16x1_2x2_4x8_2x4) { using WarpShape = cutlass::gemm::GemmShape<8, 16, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1118,9 +1118,9 @@ TEST(SM50_device_plus_multiplies_ssrgemm_nt_t, 16x128x16_8x32x1_2x4_4x8_2x4) { using WarpShape = cutlass::gemm::GemmShape<8, 32, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1154,9 +1154,9 @@ TEST(SM50_device_plus_multiplies_ssrgemm_nt_t, 32x32x8_16x8x1_2x2_8x4_2x4) { using WarpShape = cutlass::gemm::GemmShape<16, 8, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1190,9 +1190,9 @@ 
TEST(SM50_device_plus_multiplies_ssrgemm_nt_t, 32x64x8_16x16x1_4x2_4x8_2x4) { using WarpShape = cutlass::gemm::GemmShape<16, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1226,9 +1226,9 @@ TEST(SM50_device_plus_multiplies_ssrgemm_nt_t, 32x128x8_16x32x1_4x4_4x8_2x4) { using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1262,9 +1262,9 @@ TEST(SM50_device_plus_multiplies_ssrgemm_nt_t, 32x256x8_16x64x1_4x8_4x8_2x4) { using WarpShape = cutlass::gemm::GemmShape<16, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1298,9 +1298,9 @@ TEST(SM50_device_plus_multiplies_ssrgemm_nt_t, 
64x64x8_32x16x1_4x4_8x4_2x4) { using WarpShape = cutlass::gemm::GemmShape<32, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1334,9 +1334,9 @@ TEST(SM50_device_plus_multiplies_ssrgemm_nt_t, 64x128x8_32x32x1_8x4_4x8_2x4) { using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1370,9 +1370,9 @@ TEST(SM50_device_plus_multiplies_ssrgemm_nt_t, 64x256x8_32x64x1_8x8_4x8_2x4) { using WarpShape = cutlass::gemm::GemmShape<32, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1406,9 +1406,9 @@ TEST(SM50_device_plus_multiplies_ssrgemm_nt_t, 128x128x8_64x32x1_8x8_8x4_2x4) { using WarpShape = 
cutlass::gemm::GemmShape<64, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1442,9 +1442,9 @@ TEST(SM50_device_plus_multiplies_ssrgemm_nt_t, 32x32x8_8x16x1_2x2_4x8_4x2) { using WarpShape = cutlass::gemm::GemmShape<8, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1478,9 +1478,9 @@ TEST(SM50_device_plus_multiplies_ssrgemm_nt_t, 64x32x8_16x16x1_4x2_4x8_4x2) { using WarpShape = cutlass::gemm::GemmShape<16, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1514,9 +1514,9 @@ TEST(SM50_device_plus_multiplies_ssrgemm_nt_t, 64x64x8_16x32x1_4x4_4x8_4x2) { using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = 
cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1550,9 +1550,9 @@ TEST(SM50_device_plus_multiplies_ssrgemm_nt_t, 128x32x8_32x16x1_4x4_8x4_4x2) { using WarpShape = cutlass::gemm::GemmShape<32, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1586,9 +1586,9 @@ TEST(SM50_device_plus_multiplies_ssrgemm_nt_t, 128x64x8_32x32x1_8x4_4x8_4x2) { using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1622,9 +1622,9 @@ TEST(SM50_device_plus_multiplies_ssrgemm_nt_t, 128x128x8_32x64x1_8x8_4x8_4x2) { using WarpShape = cutlass::gemm::GemmShape<32, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = 
typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1658,9 +1658,9 @@ TEST(SM50_device_plus_multiplies_ssrgemm_nt_t, 256x32x8_64x16x1_8x4_8x4_4x2) { using WarpShape = cutlass::gemm::GemmShape<64, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1694,9 +1694,9 @@ TEST(SM50_device_plus_multiplies_ssrgemm_nt_t, 256x64x8_64x32x1_8x8_8x4_4x2) { using WarpShape = cutlass::gemm::GemmShape<64, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1730,9 +1730,9 @@ TEST(SM50_device_plus_multiplies_ssrgemm_nt_t, 32x64x16_8x16x1_2x2_4x8_4x4) { using WarpShape = cutlass::gemm::GemmShape<8, 16, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< 
// - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1766,9 +1766,9 @@ TEST(SM50_device_plus_multiplies_ssrgemm_nt_t, 32x128x16_8x32x1_2x4_4x8_4x4) { using WarpShape = cutlass::gemm::GemmShape<8, 32, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1802,9 +1802,9 @@ TEST(SM50_device_plus_multiplies_ssrgemm_nt_t, 64x32x16_16x8x1_2x2_8x4_4x4) { using WarpShape = cutlass::gemm::GemmShape<16, 8, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1838,9 +1838,9 @@ TEST(SM50_device_plus_multiplies_ssrgemm_nt_t, 64x64x8_16x16x1_4x2_4x8_4x4) { using WarpShape = cutlass::gemm::GemmShape<16, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // 
- cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1874,9 +1874,9 @@ TEST(SM50_device_plus_multiplies_ssrgemm_nt_t, 64x128x8_16x32x1_4x4_4x8_4x4) { using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1910,9 +1910,9 @@ TEST(SM50_device_plus_multiplies_ssrgemm_nt_t, 64x256x8_16x64x1_4x8_4x8_4x4) { using WarpShape = cutlass::gemm::GemmShape<16, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1946,9 +1946,9 @@ TEST(SM50_device_plus_multiplies_ssrgemm_nt_t, 128x32x16_32x8x1_4x2_8x4_4x4) { using WarpShape = cutlass::gemm::GemmShape<32, 8, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config 
= typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1982,9 +1982,9 @@ TEST(SM50_device_plus_multiplies_ssrgemm_nt_t, 128x64x8_32x16x1_4x4_8x4_4x4) { using WarpShape = cutlass::gemm::GemmShape<32, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -2018,9 +2018,9 @@ TEST(SM50_device_plus_multiplies_ssrgemm_nt_t, 128x128x8_32x32x1_8x4_4x8_4x4) { using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -2054,9 +2054,9 @@ TEST(SM50_device_plus_multiplies_ssrgemm_nt_t, 256x64x8_64x16x1_8x4_8x4_4x4) { using WarpShape = cutlass::gemm::GemmShape<64, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename 
cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; diff --git a/test/device/sm50_simt_plus_multiplies_ssrgemm_tn_n.cu b/test/device/sm50_simt_plus_multiplies_ssrgemm_tn_n.cu index fa563e5..49d73ca 100644 --- a/test/device/sm50_simt_plus_multiplies_ssrgemm_tn_n.cu +++ b/test/device/sm50_simt_plus_multiplies_ssrgemm_tn_n.cu @@ -38,9 +38,9 @@ TEST(SM50_device_plus_multiplies_ssrgemm_tn_n, 8x32x8_8x32x1_2x4_4x8_1x1) { using WarpShape = cutlass::gemm::GemmShape<8, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -74,9 +74,9 @@ TEST(SM50_device_plus_multiplies_ssrgemm_tn_n, 16x32x8_16x32x1_4x4_4x8_1x1) { using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -110,9 +110,9 @@ TEST(SM50_device_plus_multiplies_ssrgemm_tn_n, 16x64x8_16x64x1_4x8_4x8_1x1) { using WarpShape = cutlass::gemm::GemmShape<16, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using 
Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -146,9 +146,9 @@ TEST(SM50_device_plus_multiplies_ssrgemm_tn_n, 32x32x8_32x32x1_8x4_4x8_1x1) { using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -182,9 +182,9 @@ TEST(SM50_device_plus_multiplies_ssrgemm_tn_n, 32x64x8_32x64x1_8x8_4x8_1x1) { using WarpShape = cutlass::gemm::GemmShape<32, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -218,9 +218,9 @@ TEST(SM50_device_plus_multiplies_ssrgemm_tn_n, 64x32x8_64x32x1_8x8_8x4_1x1) { using WarpShape = cutlass::gemm::GemmShape<64, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename 
cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -254,9 +254,9 @@ TEST(SM50_device_plus_multiplies_ssrgemm_tn_n, 8x32x8_8x16x1_2x2_4x8_1x2) { using WarpShape = cutlass::gemm::GemmShape<8, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -290,9 +290,9 @@ TEST(SM50_device_plus_multiplies_ssrgemm_tn_n, 8x64x8_8x32x1_2x4_4x8_1x2) { using WarpShape = cutlass::gemm::GemmShape<8, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -326,9 +326,9 @@ TEST(SM50_device_plus_multiplies_ssrgemm_tn_n, 16x32x8_16x16x1_4x2_4x8_1x2) { using WarpShape = cutlass::gemm::GemmShape<16, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, 
precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -362,9 +362,9 @@ TEST(SM50_device_plus_multiplies_ssrgemm_tn_n, 16x64x8_16x32x1_4x4_4x8_1x2) { using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -398,9 +398,9 @@ TEST(SM50_device_plus_multiplies_ssrgemm_tn_n, 16x128x8_16x64x1_4x8_4x8_1x2) { using WarpShape = cutlass::gemm::GemmShape<16, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -434,9 +434,9 @@ TEST(SM50_device_plus_multiplies_ssrgemm_tn_n, 32x32x8_32x16x1_4x4_8x4_1x2) { using WarpShape = cutlass::gemm::GemmShape<32, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, 
cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -470,9 +470,9 @@ TEST(SM50_device_plus_multiplies_ssrgemm_tn_n, 32x64x8_32x32x1_8x4_4x8_1x2) { using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -506,9 +506,9 @@ TEST(SM50_device_plus_multiplies_ssrgemm_tn_n, 32x128x8_32x64x1_8x8_4x8_1x2) { using WarpShape = cutlass::gemm::GemmShape<32, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -542,9 +542,9 @@ TEST(SM50_device_plus_multiplies_ssrgemm_tn_n, 64x64x8_64x32x1_8x8_8x4_1x2) { using WarpShape = cutlass::gemm::GemmShape<64, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename 
cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -578,9 +578,9 @@ TEST(SM50_device_plus_multiplies_ssrgemm_tn_n, 32x32x8_16x32x1_4x4_4x8_2x1) { using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -614,9 +614,9 @@ TEST(SM50_device_plus_multiplies_ssrgemm_tn_n, 64x32x8_32x32x1_8x4_4x8_2x1) { using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -650,9 +650,9 @@ TEST(SM50_device_plus_multiplies_ssrgemm_tn_n, 64x64x8_32x64x1_8x8_4x8_2x1) { using WarpShape = cutlass::gemm::GemmShape<32, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, 
precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -686,9 +686,9 @@ TEST(SM50_device_plus_multiplies_ssrgemm_tn_n, 128x32x8_64x32x1_8x8_8x4_2x1) { using WarpShape = cutlass::gemm::GemmShape<64, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -722,9 +722,9 @@ TEST(SM50_device_plus_multiplies_ssrgemm_tn_n, 16x32x8_8x16x1_2x2_4x8_2x2) { using WarpShape = cutlass::gemm::GemmShape<8, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -758,9 +758,9 @@ TEST(SM50_device_plus_multiplies_ssrgemm_tn_n, 16x64x8_8x32x1_2x4_4x8_2x2) { using WarpShape = cutlass::gemm::GemmShape<8, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, 
OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -794,9 +794,9 @@ TEST(SM50_device_plus_multiplies_ssrgemm_tn_n, 32x32x8_16x16x1_4x2_4x8_2x2) { using WarpShape = cutlass::gemm::GemmShape<16, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -830,9 +830,9 @@ TEST(SM50_device_plus_multiplies_ssrgemm_tn_n, 32x64x8_16x32x1_4x4_4x8_2x2) { using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -866,9 +866,9 @@ TEST(SM50_device_plus_multiplies_ssrgemm_tn_n, 32x128x8_16x64x1_4x8_4x8_2x2) { using WarpShape = cutlass::gemm::GemmShape<16, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = 
Config::MultiplicationOp; @@ -902,9 +902,9 @@ TEST(SM50_device_plus_multiplies_ssrgemm_tn_n, 64x32x8_32x16x1_4x4_8x4_2x2) { using WarpShape = cutlass::gemm::GemmShape<32, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -938,9 +938,9 @@ TEST(SM50_device_plus_multiplies_ssrgemm_tn_n, 64x64x8_32x32x1_8x4_4x8_2x2) { using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -974,9 +974,9 @@ TEST(SM50_device_plus_multiplies_ssrgemm_tn_n, 64x128x8_32x64x1_8x8_4x8_2x2) { using WarpShape = cutlass::gemm::GemmShape<32, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1010,9 +1010,9 @@ 
TEST(SM50_device_plus_multiplies_ssrgemm_tn_n, 128x32x8_64x16x1_8x4_8x4_2x2) { using WarpShape = cutlass::gemm::GemmShape<64, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1046,9 +1046,9 @@ TEST(SM50_device_plus_multiplies_ssrgemm_tn_n, 128x64x8_64x32x1_8x8_8x4_2x2) { using WarpShape = cutlass::gemm::GemmShape<64, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1082,9 +1082,9 @@ TEST(SM50_device_plus_multiplies_ssrgemm_tn_n, 16x64x16_8x16x1_2x2_4x8_2x4) { using WarpShape = cutlass::gemm::GemmShape<8, 16, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1118,9 +1118,9 @@ TEST(SM50_device_plus_multiplies_ssrgemm_tn_n, 
16x128x16_8x32x1_2x4_4x8_2x4) { using WarpShape = cutlass::gemm::GemmShape<8, 32, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1154,9 +1154,9 @@ TEST(SM50_device_plus_multiplies_ssrgemm_tn_n, 32x32x8_16x8x1_2x2_8x4_2x4) { using WarpShape = cutlass::gemm::GemmShape<16, 8, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1190,9 +1190,9 @@ TEST(SM50_device_plus_multiplies_ssrgemm_tn_n, 32x64x8_16x16x1_4x2_4x8_2x4) { using WarpShape = cutlass::gemm::GemmShape<16, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1226,9 +1226,9 @@ TEST(SM50_device_plus_multiplies_ssrgemm_tn_n, 32x128x8_16x32x1_4x4_4x8_2x4) { using WarpShape = 
cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1262,9 +1262,9 @@ TEST(SM50_device_plus_multiplies_ssrgemm_tn_n, 32x256x8_16x64x1_4x8_4x8_2x4) { using WarpShape = cutlass::gemm::GemmShape<16, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1298,9 +1298,9 @@ TEST(SM50_device_plus_multiplies_ssrgemm_tn_n, 64x64x8_32x16x1_4x4_8x4_2x4) { using WarpShape = cutlass::gemm::GemmShape<32, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1334,9 +1334,9 @@ TEST(SM50_device_plus_multiplies_ssrgemm_tn_n, 64x128x8_32x32x1_8x4_4x8_2x4) { using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape 
= cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1370,9 +1370,9 @@ TEST(SM50_device_plus_multiplies_ssrgemm_tn_n, 64x256x8_32x64x1_8x8_4x8_2x4) { using WarpShape = cutlass::gemm::GemmShape<32, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1406,9 +1406,9 @@ TEST(SM50_device_plus_multiplies_ssrgemm_tn_n, 128x128x8_64x32x1_8x8_8x4_2x4) { using WarpShape = cutlass::gemm::GemmShape<64, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1442,9 +1442,9 @@ TEST(SM50_device_plus_multiplies_ssrgemm_tn_n, 32x32x8_8x16x1_2x2_4x8_4x2) { using WarpShape = cutlass::gemm::GemmShape<8, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = 
typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1478,9 +1478,9 @@ TEST(SM50_device_plus_multiplies_ssrgemm_tn_n, 64x32x8_16x16x1_4x2_4x8_4x2) { using WarpShape = cutlass::gemm::GemmShape<16, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1514,9 +1514,9 @@ TEST(SM50_device_plus_multiplies_ssrgemm_tn_n, 64x64x8_16x32x1_4x4_4x8_4x2) { using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1550,9 +1550,9 @@ TEST(SM50_device_plus_multiplies_ssrgemm_tn_n, 128x32x8_32x16x1_4x4_8x4_4x2) { using WarpShape = cutlass::gemm::GemmShape<32, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< 
// - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1586,9 +1586,9 @@ TEST(SM50_device_plus_multiplies_ssrgemm_tn_n, 128x64x8_32x32x1_8x4_4x8_4x2) { using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1622,9 +1622,9 @@ TEST(SM50_device_plus_multiplies_ssrgemm_tn_n, 128x128x8_32x64x1_8x8_4x8_4x2) { using WarpShape = cutlass::gemm::GemmShape<32, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1658,9 +1658,9 @@ TEST(SM50_device_plus_multiplies_ssrgemm_tn_n, 256x32x8_64x16x1_8x4_8x4_4x2) { using WarpShape = cutlass::gemm::GemmShape<64, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, 
// - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1694,9 +1694,9 @@ TEST(SM50_device_plus_multiplies_ssrgemm_tn_n, 256x64x8_64x32x1_8x8_8x4_4x2) { using WarpShape = cutlass::gemm::GemmShape<64, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1730,9 +1730,9 @@ TEST(SM50_device_plus_multiplies_ssrgemm_tn_n, 32x64x16_8x16x1_2x2_4x8_4x4) { using WarpShape = cutlass::gemm::GemmShape<8, 16, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1766,9 +1766,9 @@ TEST(SM50_device_plus_multiplies_ssrgemm_tn_n, 32x128x16_8x32x1_2x4_4x8_4x4) { using WarpShape = cutlass::gemm::GemmShape<8, 32, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using 
Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1802,9 +1802,9 @@ TEST(SM50_device_plus_multiplies_ssrgemm_tn_n, 64x32x16_16x8x1_2x2_8x4_4x4) { using WarpShape = cutlass::gemm::GemmShape<16, 8, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1838,9 +1838,9 @@ TEST(SM50_device_plus_multiplies_ssrgemm_tn_n, 64x64x8_16x16x1_4x2_4x8_4x4) { using WarpShape = cutlass::gemm::GemmShape<16, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1874,9 +1874,9 @@ TEST(SM50_device_plus_multiplies_ssrgemm_tn_n, 64x128x8_16x32x1_4x4_4x8_4x4) { using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename 
cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1910,9 +1910,9 @@ TEST(SM50_device_plus_multiplies_ssrgemm_tn_n, 64x256x8_16x64x1_4x8_4x8_4x4) { using WarpShape = cutlass::gemm::GemmShape<16, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1946,9 +1946,9 @@ TEST(SM50_device_plus_multiplies_ssrgemm_tn_n, 128x32x16_32x8x1_4x2_8x4_4x4) { using WarpShape = cutlass::gemm::GemmShape<32, 8, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1982,9 +1982,9 @@ TEST(SM50_device_plus_multiplies_ssrgemm_tn_n, 128x64x8_32x16x1_4x4_8x4_4x4) { using WarpShape = cutlass::gemm::GemmShape<32, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + 
precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -2018,9 +2018,9 @@ TEST(SM50_device_plus_multiplies_ssrgemm_tn_n, 128x128x8_32x32x1_8x4_4x8_4x4) { using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -2054,9 +2054,9 @@ TEST(SM50_device_plus_multiplies_ssrgemm_tn_n, 256x64x8_64x16x1_8x4_8x4_4x4) { using WarpShape = cutlass::gemm::GemmShape<64, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; diff --git a/test/device/sm50_simt_plus_multiplies_ssrgemm_tn_t.cu b/test/device/sm50_simt_plus_multiplies_ssrgemm_tn_t.cu index e15d682..39e2616 100644 --- a/test/device/sm50_simt_plus_multiplies_ssrgemm_tn_t.cu +++ b/test/device/sm50_simt_plus_multiplies_ssrgemm_tn_t.cu @@ -38,9 +38,9 @@ TEST(SM50_device_plus_multiplies_ssrgemm_tn_t, 8x32x8_8x32x1_2x4_4x8_1x1) { using WarpShape = cutlass::gemm::GemmShape<8, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename 
cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -74,9 +74,9 @@ TEST(SM50_device_plus_multiplies_ssrgemm_tn_t, 16x32x8_16x32x1_4x4_4x8_1x1) { using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -110,9 +110,9 @@ TEST(SM50_device_plus_multiplies_ssrgemm_tn_t, 16x64x8_16x64x1_4x8_4x8_1x1) { using WarpShape = cutlass::gemm::GemmShape<16, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -146,9 +146,9 @@ TEST(SM50_device_plus_multiplies_ssrgemm_tn_t, 32x32x8_32x32x1_8x4_4x8_1x1) { using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, 
precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -182,9 +182,9 @@ TEST(SM50_device_plus_multiplies_ssrgemm_tn_t, 32x64x8_32x64x1_8x8_4x8_1x1) { using WarpShape = cutlass::gemm::GemmShape<32, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -218,9 +218,9 @@ TEST(SM50_device_plus_multiplies_ssrgemm_tn_t, 64x32x8_64x32x1_8x8_8x4_1x1) { using WarpShape = cutlass::gemm::GemmShape<64, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -254,9 +254,9 @@ TEST(SM50_device_plus_multiplies_ssrgemm_tn_t, 8x32x8_8x16x1_2x2_4x8_1x2) { using WarpShape = cutlass::gemm::GemmShape<8, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, 
cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -290,9 +290,9 @@ TEST(SM50_device_plus_multiplies_ssrgemm_tn_t, 8x64x8_8x32x1_2x4_4x8_1x2) { using WarpShape = cutlass::gemm::GemmShape<8, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -326,9 +326,9 @@ TEST(SM50_device_plus_multiplies_ssrgemm_tn_t, 16x32x8_16x16x1_4x2_4x8_1x2) { using WarpShape = cutlass::gemm::GemmShape<16, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -362,9 +362,9 @@ TEST(SM50_device_plus_multiplies_ssrgemm_tn_t, 16x64x8_16x32x1_4x4_4x8_1x2) { using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename 
cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -398,9 +398,9 @@ TEST(SM50_device_plus_multiplies_ssrgemm_tn_t, 16x128x8_16x64x1_4x8_4x8_1x2) { using WarpShape = cutlass::gemm::GemmShape<16, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -434,9 +434,9 @@ TEST(SM50_device_plus_multiplies_ssrgemm_tn_t, 32x32x8_32x16x1_4x4_8x4_1x2) { using WarpShape = cutlass::gemm::GemmShape<32, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -470,9 +470,9 @@ TEST(SM50_device_plus_multiplies_ssrgemm_tn_t, 32x64x8_32x32x1_8x4_4x8_1x2) { using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, 
precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -506,9 +506,9 @@ TEST(SM50_device_plus_multiplies_ssrgemm_tn_t, 32x128x8_32x64x1_8x8_4x8_1x2) { using WarpShape = cutlass::gemm::GemmShape<32, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -542,9 +542,9 @@ TEST(SM50_device_plus_multiplies_ssrgemm_tn_t, 64x64x8_64x32x1_8x8_8x4_1x2) { using WarpShape = cutlass::gemm::GemmShape<64, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -578,9 +578,9 @@ TEST(SM50_device_plus_multiplies_ssrgemm_tn_t, 32x32x8_16x32x1_4x4_4x8_2x1) { using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, 
OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -614,9 +614,9 @@ TEST(SM50_device_plus_multiplies_ssrgemm_tn_t, 64x32x8_32x32x1_8x4_4x8_2x1) { using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -650,9 +650,9 @@ TEST(SM50_device_plus_multiplies_ssrgemm_tn_t, 64x64x8_32x64x1_8x8_4x8_2x1) { using WarpShape = cutlass::gemm::GemmShape<32, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -686,9 +686,9 @@ TEST(SM50_device_plus_multiplies_ssrgemm_tn_t, 128x32x8_64x32x1_8x8_8x4_2x1) { using WarpShape = cutlass::gemm::GemmShape<64, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = 
Config::MultiplicationOp; @@ -722,9 +722,9 @@ TEST(SM50_device_plus_multiplies_ssrgemm_tn_t, 16x32x8_8x16x1_2x2_4x8_2x2) { using WarpShape = cutlass::gemm::GemmShape<8, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -758,9 +758,9 @@ TEST(SM50_device_plus_multiplies_ssrgemm_tn_t, 16x64x8_8x32x1_2x4_4x8_2x2) { using WarpShape = cutlass::gemm::GemmShape<8, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -794,9 +794,9 @@ TEST(SM50_device_plus_multiplies_ssrgemm_tn_t, 32x32x8_16x16x1_4x2_4x8_2x2) { using WarpShape = cutlass::gemm::GemmShape<16, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -830,9 +830,9 @@ 
TEST(SM50_device_plus_multiplies_ssrgemm_tn_t, 32x64x8_16x32x1_4x4_4x8_2x2) { using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -866,9 +866,9 @@ TEST(SM50_device_plus_multiplies_ssrgemm_tn_t, 32x128x8_16x64x1_4x8_4x8_2x2) { using WarpShape = cutlass::gemm::GemmShape<16, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -902,9 +902,9 @@ TEST(SM50_device_plus_multiplies_ssrgemm_tn_t, 64x32x8_32x16x1_4x4_8x4_2x2) { using WarpShape = cutlass::gemm::GemmShape<32, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -938,9 +938,9 @@ TEST(SM50_device_plus_multiplies_ssrgemm_tn_t, 
64x64x8_32x32x1_8x4_4x8_2x2) { using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -974,9 +974,9 @@ TEST(SM50_device_plus_multiplies_ssrgemm_tn_t, 64x128x8_32x64x1_8x8_4x8_2x2) { using WarpShape = cutlass::gemm::GemmShape<32, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1010,9 +1010,9 @@ TEST(SM50_device_plus_multiplies_ssrgemm_tn_t, 128x32x8_64x16x1_8x4_8x4_2x2) { using WarpShape = cutlass::gemm::GemmShape<64, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1046,9 +1046,9 @@ TEST(SM50_device_plus_multiplies_ssrgemm_tn_t, 128x64x8_64x32x1_8x8_8x4_2x2) { using WarpShape = 
cutlass::gemm::GemmShape<64, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1082,9 +1082,9 @@ TEST(SM50_device_plus_multiplies_ssrgemm_tn_t, 16x64x16_8x16x1_2x2_4x8_2x4) { using WarpShape = cutlass::gemm::GemmShape<8, 16, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1118,9 +1118,9 @@ TEST(SM50_device_plus_multiplies_ssrgemm_tn_t, 16x128x16_8x32x1_2x4_4x8_2x4) { using WarpShape = cutlass::gemm::GemmShape<8, 32, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1154,9 +1154,9 @@ TEST(SM50_device_plus_multiplies_ssrgemm_tn_t, 32x32x8_16x8x1_2x2_8x4_2x4) { using WarpShape = cutlass::gemm::GemmShape<16, 8, 8>; using InstructionShape = 
cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1190,9 +1190,9 @@ TEST(SM50_device_plus_multiplies_ssrgemm_tn_t, 32x64x8_16x16x1_4x2_4x8_2x4) { using WarpShape = cutlass::gemm::GemmShape<16, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1226,9 +1226,9 @@ TEST(SM50_device_plus_multiplies_ssrgemm_tn_t, 32x128x8_16x32x1_4x4_4x8_2x4) { using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1262,9 +1262,9 @@ TEST(SM50_device_plus_multiplies_ssrgemm_tn_t, 32x256x8_16x64x1_4x8_4x8_2x4) { using WarpShape = cutlass::gemm::GemmShape<16, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = 
typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1298,9 +1298,9 @@ TEST(SM50_device_plus_multiplies_ssrgemm_tn_t, 64x64x8_32x16x1_4x4_8x4_2x4) { using WarpShape = cutlass::gemm::GemmShape<32, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1334,9 +1334,9 @@ TEST(SM50_device_plus_multiplies_ssrgemm_tn_t, 64x128x8_32x32x1_8x4_4x8_2x4) { using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1370,9 +1370,9 @@ TEST(SM50_device_plus_multiplies_ssrgemm_tn_t, 64x256x8_32x64x1_8x8_4x8_2x4) { using WarpShape = cutlass::gemm::GemmShape<32, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< 
// - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1406,9 +1406,9 @@ TEST(SM50_device_plus_multiplies_ssrgemm_tn_t, 128x128x8_64x32x1_8x8_8x4_2x4) { using WarpShape = cutlass::gemm::GemmShape<64, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1442,9 +1442,9 @@ TEST(SM50_device_plus_multiplies_ssrgemm_tn_t, 32x32x8_8x16x1_2x2_4x8_4x2) { using WarpShape = cutlass::gemm::GemmShape<8, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1478,9 +1478,9 @@ TEST(SM50_device_plus_multiplies_ssrgemm_tn_t, 64x32x8_16x16x1_4x2_4x8_4x2) { using WarpShape = cutlass::gemm::GemmShape<16, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // 
- cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1514,9 +1514,9 @@ TEST(SM50_device_plus_multiplies_ssrgemm_tn_t, 64x64x8_16x32x1_4x4_4x8_4x2) { using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1550,9 +1550,9 @@ TEST(SM50_device_plus_multiplies_ssrgemm_tn_t, 128x32x8_32x16x1_4x4_8x4_4x2) { using WarpShape = cutlass::gemm::GemmShape<32, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1586,9 +1586,9 @@ TEST(SM50_device_plus_multiplies_ssrgemm_tn_t, 128x64x8_32x32x1_8x4_4x8_4x2) { using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = 
typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1622,9 +1622,9 @@ TEST(SM50_device_plus_multiplies_ssrgemm_tn_t, 128x128x8_32x64x1_8x8_4x8_4x2) { using WarpShape = cutlass::gemm::GemmShape<32, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1658,9 +1658,9 @@ TEST(SM50_device_plus_multiplies_ssrgemm_tn_t, 256x32x8_64x16x1_8x4_8x4_4x2) { using WarpShape = cutlass::gemm::GemmShape<64, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1694,9 +1694,9 @@ TEST(SM50_device_plus_multiplies_ssrgemm_tn_t, 256x64x8_64x32x1_8x8_8x4_4x2) { using WarpShape = cutlass::gemm::GemmShape<64, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename 
cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1730,9 +1730,9 @@ TEST(SM50_device_plus_multiplies_ssrgemm_tn_t, 32x64x16_8x16x1_2x2_4x8_4x4) { using WarpShape = cutlass::gemm::GemmShape<8, 16, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1766,9 +1766,9 @@ TEST(SM50_device_plus_multiplies_ssrgemm_tn_t, 32x128x16_8x32x1_2x4_4x8_4x4) { using WarpShape = cutlass::gemm::GemmShape<8, 32, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1802,9 +1802,9 @@ TEST(SM50_device_plus_multiplies_ssrgemm_tn_t, 64x32x16_16x8x1_2x2_8x4_4x4) { using WarpShape = cutlass::gemm::GemmShape<16, 8, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + 
precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1838,9 +1838,9 @@ TEST(SM50_device_plus_multiplies_ssrgemm_tn_t, 64x64x8_16x16x1_4x2_4x8_4x4) { using WarpShape = cutlass::gemm::GemmShape<16, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1874,9 +1874,9 @@ TEST(SM50_device_plus_multiplies_ssrgemm_tn_t, 64x128x8_16x32x1_4x4_4x8_4x4) { using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1910,9 +1910,9 @@ TEST(SM50_device_plus_multiplies_ssrgemm_tn_t, 64x256x8_16x64x1_4x8_4x8_4x4) { using WarpShape = cutlass::gemm::GemmShape<16, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, 
cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1946,9 +1946,9 @@ TEST(SM50_device_plus_multiplies_ssrgemm_tn_t, 128x32x16_32x8x1_4x2_8x4_4x4) { using WarpShape = cutlass::gemm::GemmShape<32, 8, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1982,9 +1982,9 @@ TEST(SM50_device_plus_multiplies_ssrgemm_tn_t, 128x64x8_32x16x1_4x4_8x4_4x4) { using WarpShape = cutlass::gemm::GemmShape<32, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -2018,9 +2018,9 @@ TEST(SM50_device_plus_multiplies_ssrgemm_tn_t, 128x128x8_32x32x1_8x4_4x8_4x4) { using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = 
Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -2054,9 +2054,9 @@ TEST(SM50_device_plus_multiplies_ssrgemm_tn_t, 256x64x8_64x16x1_8x4_8x4_4x4) { using WarpShape = cutlass::gemm::GemmShape<64, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; diff --git a/test/device/sm50_simt_plus_multiplies_ssrgemm_tt_n.cu b/test/device/sm50_simt_plus_multiplies_ssrgemm_tt_n.cu index ddf8323..5216bf3 100644 --- a/test/device/sm50_simt_plus_multiplies_ssrgemm_tt_n.cu +++ b/test/device/sm50_simt_plus_multiplies_ssrgemm_tt_n.cu @@ -38,9 +38,9 @@ TEST(SM50_device_plus_multiplies_ssrgemm_tt_n, 8x32x8_8x32x1_2x4_4x8_1x1) { using WarpShape = cutlass::gemm::GemmShape<8, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -74,9 +74,9 @@ TEST(SM50_device_plus_multiplies_ssrgemm_tt_n, 16x32x8_16x32x1_4x4_4x8_1x1) { using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, 
cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -110,9 +110,9 @@ TEST(SM50_device_plus_multiplies_ssrgemm_tt_n, 16x64x8_16x64x1_4x8_4x8_1x1) { using WarpShape = cutlass::gemm::GemmShape<16, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -146,9 +146,9 @@ TEST(SM50_device_plus_multiplies_ssrgemm_tt_n, 32x32x8_32x32x1_8x4_4x8_1x1) { using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -182,9 +182,9 @@ TEST(SM50_device_plus_multiplies_ssrgemm_tt_n, 32x64x8_32x64x1_8x8_4x8_1x1) { using WarpShape = cutlass::gemm::GemmShape<32, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename 
cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -218,9 +218,9 @@ TEST(SM50_device_plus_multiplies_ssrgemm_tt_n, 64x32x8_64x32x1_8x8_8x4_1x1) { using WarpShape = cutlass::gemm::GemmShape<64, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -254,9 +254,9 @@ TEST(SM50_device_plus_multiplies_ssrgemm_tt_n, 8x32x8_8x16x1_2x2_4x8_1x2) { using WarpShape = cutlass::gemm::GemmShape<8, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -290,9 +290,9 @@ TEST(SM50_device_plus_multiplies_ssrgemm_tt_n, 8x64x8_8x32x1_2x4_4x8_1x2) { using WarpShape = cutlass::gemm::GemmShape<8, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, 
precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -326,9 +326,9 @@ TEST(SM50_device_plus_multiplies_ssrgemm_tt_n, 16x32x8_16x16x1_4x2_4x8_1x2) { using WarpShape = cutlass::gemm::GemmShape<16, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -362,9 +362,9 @@ TEST(SM50_device_plus_multiplies_ssrgemm_tt_n, 16x64x8_16x32x1_4x4_4x8_1x2) { using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -398,9 +398,9 @@ TEST(SM50_device_plus_multiplies_ssrgemm_tt_n, 16x128x8_16x64x1_4x8_4x8_1x2) { using WarpShape = cutlass::gemm::GemmShape<16, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, 
OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -434,9 +434,9 @@ TEST(SM50_device_plus_multiplies_ssrgemm_tt_n, 32x32x8_32x16x1_4x4_8x4_1x2) { using WarpShape = cutlass::gemm::GemmShape<32, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -470,9 +470,9 @@ TEST(SM50_device_plus_multiplies_ssrgemm_tt_n, 32x64x8_32x32x1_8x4_4x8_1x2) { using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -506,9 +506,9 @@ TEST(SM50_device_plus_multiplies_ssrgemm_tt_n, 32x128x8_32x64x1_8x8_4x8_1x2) { using WarpShape = cutlass::gemm::GemmShape<32, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = 
Config::MultiplicationOp; @@ -542,9 +542,9 @@ TEST(SM50_device_plus_multiplies_ssrgemm_tt_n, 64x64x8_64x32x1_8x8_8x4_1x2) { using WarpShape = cutlass::gemm::GemmShape<64, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -578,9 +578,9 @@ TEST(SM50_device_plus_multiplies_ssrgemm_tt_n, 32x32x8_16x32x1_4x4_4x8_2x1) { using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -614,9 +614,9 @@ TEST(SM50_device_plus_multiplies_ssrgemm_tt_n, 64x32x8_32x32x1_8x4_4x8_2x1) { using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -650,9 +650,9 @@ 
TEST(SM50_device_plus_multiplies_ssrgemm_tt_n, 64x64x8_32x64x1_8x8_4x8_2x1) { using WarpShape = cutlass::gemm::GemmShape<32, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -686,9 +686,9 @@ TEST(SM50_device_plus_multiplies_ssrgemm_tt_n, 128x32x8_64x32x1_8x8_8x4_2x1) { using WarpShape = cutlass::gemm::GemmShape<64, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -722,9 +722,9 @@ TEST(SM50_device_plus_multiplies_ssrgemm_tt_n, 16x32x8_8x16x1_2x2_4x8_2x2) { using WarpShape = cutlass::gemm::GemmShape<8, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -758,9 +758,9 @@ TEST(SM50_device_plus_multiplies_ssrgemm_tt_n, 
16x64x8_8x32x1_2x4_4x8_2x2) { using WarpShape = cutlass::gemm::GemmShape<8, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -794,9 +794,9 @@ TEST(SM50_device_plus_multiplies_ssrgemm_tt_n, 32x32x8_16x16x1_4x2_4x8_2x2) { using WarpShape = cutlass::gemm::GemmShape<16, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -830,9 +830,9 @@ TEST(SM50_device_plus_multiplies_ssrgemm_tt_n, 32x64x8_16x32x1_4x4_4x8_2x2) { using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -866,9 +866,9 @@ TEST(SM50_device_plus_multiplies_ssrgemm_tt_n, 32x128x8_16x64x1_4x8_4x8_2x2) { using WarpShape = 
cutlass::gemm::GemmShape<16, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -902,9 +902,9 @@ TEST(SM50_device_plus_multiplies_ssrgemm_tt_n, 64x32x8_32x16x1_4x4_8x4_2x2) { using WarpShape = cutlass::gemm::GemmShape<32, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -938,9 +938,9 @@ TEST(SM50_device_plus_multiplies_ssrgemm_tt_n, 64x64x8_32x32x1_8x4_4x8_2x2) { using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -974,9 +974,9 @@ TEST(SM50_device_plus_multiplies_ssrgemm_tt_n, 64x128x8_32x64x1_8x8_4x8_2x2) { using WarpShape = cutlass::gemm::GemmShape<32, 64, 8>; using InstructionShape = 
cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1010,9 +1010,9 @@ TEST(SM50_device_plus_multiplies_ssrgemm_tt_n, 128x32x8_64x16x1_8x4_8x4_2x2) { using WarpShape = cutlass::gemm::GemmShape<64, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1046,9 +1046,9 @@ TEST(SM50_device_plus_multiplies_ssrgemm_tt_n, 128x64x8_64x32x1_8x8_8x4_2x2) { using WarpShape = cutlass::gemm::GemmShape<64, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1082,9 +1082,9 @@ TEST(SM50_device_plus_multiplies_ssrgemm_tt_n, 16x64x16_8x16x1_2x2_4x8_2x4) { using WarpShape = cutlass::gemm::GemmShape<8, 16, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = 
typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1118,9 +1118,9 @@ TEST(SM50_device_plus_multiplies_ssrgemm_tt_n, 16x128x16_8x32x1_2x4_4x8_2x4) { using WarpShape = cutlass::gemm::GemmShape<8, 32, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1154,9 +1154,9 @@ TEST(SM50_device_plus_multiplies_ssrgemm_tt_n, 32x32x8_16x8x1_2x2_8x4_2x4) { using WarpShape = cutlass::gemm::GemmShape<16, 8, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1190,9 +1190,9 @@ TEST(SM50_device_plus_multiplies_ssrgemm_tt_n, 32x64x8_16x16x1_4x2_4x8_2x4) { using WarpShape = cutlass::gemm::GemmShape<16, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // 
- precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1226,9 +1226,9 @@ TEST(SM50_device_plus_multiplies_ssrgemm_tt_n, 32x128x8_16x32x1_4x4_4x8_2x4) { using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1262,9 +1262,9 @@ TEST(SM50_device_plus_multiplies_ssrgemm_tt_n, 32x256x8_16x64x1_4x8_4x8_2x4) { using WarpShape = cutlass::gemm::GemmShape<16, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1298,9 +1298,9 @@ TEST(SM50_device_plus_multiplies_ssrgemm_tt_n, 64x64x8_32x16x1_4x4_8x4_2x4) { using WarpShape = cutlass::gemm::GemmShape<32, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - 
cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1334,9 +1334,9 @@ TEST(SM50_device_plus_multiplies_ssrgemm_tt_n, 64x128x8_32x32x1_8x4_4x8_2x4) { using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1370,9 +1370,9 @@ TEST(SM50_device_plus_multiplies_ssrgemm_tt_n, 64x256x8_32x64x1_8x8_4x8_2x4) { using WarpShape = cutlass::gemm::GemmShape<32, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1406,9 +1406,9 @@ TEST(SM50_device_plus_multiplies_ssrgemm_tt_n, 128x128x8_64x32x1_8x8_8x4_2x4) { using WarpShape = cutlass::gemm::GemmShape<64, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = 
typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1442,9 +1442,9 @@ TEST(SM50_device_plus_multiplies_ssrgemm_tt_n, 32x32x8_8x16x1_2x2_4x8_4x2) { using WarpShape = cutlass::gemm::GemmShape<8, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1478,9 +1478,9 @@ TEST(SM50_device_plus_multiplies_ssrgemm_tt_n, 64x32x8_16x16x1_4x2_4x8_4x2) { using WarpShape = cutlass::gemm::GemmShape<16, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1514,9 +1514,9 @@ TEST(SM50_device_plus_multiplies_ssrgemm_tt_n, 64x64x8_16x32x1_4x4_4x8_4x2) { using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + 
precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1550,9 +1550,9 @@ TEST(SM50_device_plus_multiplies_ssrgemm_tt_n, 128x32x8_32x16x1_4x4_8x4_4x2) { using WarpShape = cutlass::gemm::GemmShape<32, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1586,9 +1586,9 @@ TEST(SM50_device_plus_multiplies_ssrgemm_tt_n, 128x64x8_32x32x1_8x4_4x8_4x2) { using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1622,9 +1622,9 @@ TEST(SM50_device_plus_multiplies_ssrgemm_tt_n, 128x128x8_32x64x1_8x8_4x8_4x2) { using WarpShape = cutlass::gemm::GemmShape<32, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + 
cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1658,9 +1658,9 @@ TEST(SM50_device_plus_multiplies_ssrgemm_tt_n, 256x32x8_64x16x1_8x4_8x4_4x2) { using WarpShape = cutlass::gemm::GemmShape<64, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1694,9 +1694,9 @@ TEST(SM50_device_plus_multiplies_ssrgemm_tt_n, 256x64x8_64x32x1_8x8_8x4_4x2) { using WarpShape = cutlass::gemm::GemmShape<64, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1730,9 +1730,9 @@ TEST(SM50_device_plus_multiplies_ssrgemm_tt_n, 32x64x16_8x16x1_2x2_4x8_4x4) { using WarpShape = cutlass::gemm::GemmShape<8, 16, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using 
AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1766,9 +1766,9 @@ TEST(SM50_device_plus_multiplies_ssrgemm_tt_n, 32x128x16_8x32x1_2x4_4x8_4x4) { using WarpShape = cutlass::gemm::GemmShape<8, 32, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1802,9 +1802,9 @@ TEST(SM50_device_plus_multiplies_ssrgemm_tt_n, 64x32x16_16x8x1_2x2_8x4_4x4) { using WarpShape = cutlass::gemm::GemmShape<16, 8, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1838,9 +1838,9 @@ TEST(SM50_device_plus_multiplies_ssrgemm_tt_n, 64x64x8_16x16x1_4x2_4x8_4x4) { using WarpShape = cutlass::gemm::GemmShape<16, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = 
Config::MultiplicationOp; @@ -1874,9 +1874,9 @@ TEST(SM50_device_plus_multiplies_ssrgemm_tt_n, 64x128x8_16x32x1_4x4_4x8_4x4) { using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1910,9 +1910,9 @@ TEST(SM50_device_plus_multiplies_ssrgemm_tt_n, 64x256x8_16x64x1_4x8_4x8_4x4) { using WarpShape = cutlass::gemm::GemmShape<16, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1946,9 +1946,9 @@ TEST(SM50_device_plus_multiplies_ssrgemm_tt_n, 128x32x16_32x8x1_4x2_8x4_4x4) { using WarpShape = cutlass::gemm::GemmShape<32, 8, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1982,9 +1982,9 @@ 
TEST(SM50_device_plus_multiplies_ssrgemm_tt_n, 128x64x8_32x16x1_4x4_8x4_4x4) { using WarpShape = cutlass::gemm::GemmShape<32, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -2018,9 +2018,9 @@ TEST(SM50_device_plus_multiplies_ssrgemm_tt_n, 128x128x8_32x32x1_8x4_4x8_4x4) { using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -2054,9 +2054,9 @@ TEST(SM50_device_plus_multiplies_ssrgemm_tt_n, 256x64x8_64x16x1_8x4_8x4_4x4) { using WarpShape = cutlass::gemm::GemmShape<64, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; diff --git a/test/device/sm50_simt_plus_multiplies_ssrgemm_tt_t.cu 
b/test/device/sm50_simt_plus_multiplies_ssrgemm_tt_t.cu index 1cacc99..759c2aa 100644 --- a/test/device/sm50_simt_plus_multiplies_ssrgemm_tt_t.cu +++ b/test/device/sm50_simt_plus_multiplies_ssrgemm_tt_t.cu @@ -38,9 +38,9 @@ TEST(SM50_device_plus_multiplies_ssrgemm_tt_t, 8x32x8_8x32x1_2x4_4x8_1x1) { using WarpShape = cutlass::gemm::GemmShape<8, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -74,9 +74,9 @@ TEST(SM50_device_plus_multiplies_ssrgemm_tt_t, 16x32x8_16x32x1_4x4_4x8_1x1) { using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -110,9 +110,9 @@ TEST(SM50_device_plus_multiplies_ssrgemm_tt_t, 16x64x8_16x64x1_4x8_4x8_1x1) { using WarpShape = cutlass::gemm::GemmShape<16, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, 
precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -146,9 +146,9 @@ TEST(SM50_device_plus_multiplies_ssrgemm_tt_t, 32x32x8_32x32x1_8x4_4x8_1x1) { using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -182,9 +182,9 @@ TEST(SM50_device_plus_multiplies_ssrgemm_tt_t, 32x64x8_32x64x1_8x8_4x8_1x1) { using WarpShape = cutlass::gemm::GemmShape<32, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -218,9 +218,9 @@ TEST(SM50_device_plus_multiplies_ssrgemm_tt_t, 64x32x8_64x32x1_8x8_8x4_1x1) { using WarpShape = cutlass::gemm::GemmShape<64, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; 
using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -254,9 +254,9 @@ TEST(SM50_device_plus_multiplies_ssrgemm_tt_t, 8x32x8_8x16x1_2x2_4x8_1x2) { using WarpShape = cutlass::gemm::GemmShape<8, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -290,9 +290,9 @@ TEST(SM50_device_plus_multiplies_ssrgemm_tt_t, 8x64x8_8x32x1_2x4_4x8_1x2) { using WarpShape = cutlass::gemm::GemmShape<8, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -326,9 +326,9 @@ TEST(SM50_device_plus_multiplies_ssrgemm_tt_t, 16x32x8_16x16x1_4x2_4x8_1x2) { using WarpShape = cutlass::gemm::GemmShape<16, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = 
Config::MultiplicationOp; @@ -362,9 +362,9 @@ TEST(SM50_device_plus_multiplies_ssrgemm_tt_t, 16x64x8_16x32x1_4x4_4x8_1x2) { using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -398,9 +398,9 @@ TEST(SM50_device_plus_multiplies_ssrgemm_tt_t, 16x128x8_16x64x1_4x8_4x8_1x2) { using WarpShape = cutlass::gemm::GemmShape<16, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -434,9 +434,9 @@ TEST(SM50_device_plus_multiplies_ssrgemm_tt_t, 32x32x8_32x16x1_4x4_8x4_1x2) { using WarpShape = cutlass::gemm::GemmShape<32, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -470,9 +470,9 @@ 
TEST(SM50_device_plus_multiplies_ssrgemm_tt_t, 32x64x8_32x32x1_8x4_4x8_1x2) { using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -506,9 +506,9 @@ TEST(SM50_device_plus_multiplies_ssrgemm_tt_t, 32x128x8_32x64x1_8x8_4x8_1x2) { using WarpShape = cutlass::gemm::GemmShape<32, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -542,9 +542,9 @@ TEST(SM50_device_plus_multiplies_ssrgemm_tt_t, 64x64x8_64x32x1_8x8_8x4_1x2) { using WarpShape = cutlass::gemm::GemmShape<64, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -578,9 +578,9 @@ TEST(SM50_device_plus_multiplies_ssrgemm_tt_t, 
32x32x8_16x32x1_4x4_4x8_2x1) { using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -614,9 +614,9 @@ TEST(SM50_device_plus_multiplies_ssrgemm_tt_t, 64x32x8_32x32x1_8x4_4x8_2x1) { using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -650,9 +650,9 @@ TEST(SM50_device_plus_multiplies_ssrgemm_tt_t, 64x64x8_32x64x1_8x8_4x8_2x1) { using WarpShape = cutlass::gemm::GemmShape<32, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -686,9 +686,9 @@ TEST(SM50_device_plus_multiplies_ssrgemm_tt_t, 128x32x8_64x32x1_8x8_8x4_2x1) { using WarpShape = 
cutlass::gemm::GemmShape<64, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -722,9 +722,9 @@ TEST(SM50_device_plus_multiplies_ssrgemm_tt_t, 16x32x8_8x16x1_2x2_4x8_2x2) { using WarpShape = cutlass::gemm::GemmShape<8, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -758,9 +758,9 @@ TEST(SM50_device_plus_multiplies_ssrgemm_tt_t, 16x64x8_8x32x1_2x4_4x8_2x2) { using WarpShape = cutlass::gemm::GemmShape<8, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -794,9 +794,9 @@ TEST(SM50_device_plus_multiplies_ssrgemm_tt_t, 32x32x8_16x16x1_4x2_4x8_2x2) { using WarpShape = cutlass::gemm::GemmShape<16, 16, 8>; using InstructionShape = 
cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -830,9 +830,9 @@ TEST(SM50_device_plus_multiplies_ssrgemm_tt_t, 32x64x8_16x32x1_4x4_4x8_2x2) { using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -866,9 +866,9 @@ TEST(SM50_device_plus_multiplies_ssrgemm_tt_t, 32x128x8_16x64x1_4x8_4x8_2x2) { using WarpShape = cutlass::gemm::GemmShape<16, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -902,9 +902,9 @@ TEST(SM50_device_plus_multiplies_ssrgemm_tt_t, 64x32x8_32x16x1_4x4_8x4_2x2) { using WarpShape = cutlass::gemm::GemmShape<32, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename 
cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -938,9 +938,9 @@ TEST(SM50_device_plus_multiplies_ssrgemm_tt_t, 64x64x8_32x32x1_8x4_4x8_2x2) { using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -974,9 +974,9 @@ TEST(SM50_device_plus_multiplies_ssrgemm_tt_t, 64x128x8_32x64x1_8x8_4x8_2x2) { using WarpShape = cutlass::gemm::GemmShape<32, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1010,9 +1010,9 @@ TEST(SM50_device_plus_multiplies_ssrgemm_tt_t, 128x32x8_64x16x1_8x4_8x4_2x2) { using WarpShape = cutlass::gemm::GemmShape<64, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - 
precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1046,9 +1046,9 @@ TEST(SM50_device_plus_multiplies_ssrgemm_tt_t, 128x64x8_64x32x1_8x8_8x4_2x2) { using WarpShape = cutlass::gemm::GemmShape<64, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1082,9 +1082,9 @@ TEST(SM50_device_plus_multiplies_ssrgemm_tt_t, 16x64x16_8x16x1_2x2_4x8_2x4) { using WarpShape = cutlass::gemm::GemmShape<8, 16, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1118,9 +1118,9 @@ TEST(SM50_device_plus_multiplies_ssrgemm_tt_t, 16x128x16_8x32x1_2x4_4x8_2x4) { using WarpShape = cutlass::gemm::GemmShape<8, 32, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - 
cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1154,9 +1154,9 @@ TEST(SM50_device_plus_multiplies_ssrgemm_tt_t, 32x32x8_16x8x1_2x2_8x4_2x4) { using WarpShape = cutlass::gemm::GemmShape<16, 8, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1190,9 +1190,9 @@ TEST(SM50_device_plus_multiplies_ssrgemm_tt_t, 32x64x8_16x16x1_4x2_4x8_2x4) { using WarpShape = cutlass::gemm::GemmShape<16, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1226,9 +1226,9 @@ TEST(SM50_device_plus_multiplies_ssrgemm_tt_t, 32x128x8_16x32x1_4x4_4x8_2x4) { using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = 
typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1262,9 +1262,9 @@ TEST(SM50_device_plus_multiplies_ssrgemm_tt_t, 32x256x8_16x64x1_4x8_4x8_2x4) { using WarpShape = cutlass::gemm::GemmShape<16, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1298,9 +1298,9 @@ TEST(SM50_device_plus_multiplies_ssrgemm_tt_t, 64x64x8_32x16x1_4x4_8x4_2x4) { using WarpShape = cutlass::gemm::GemmShape<32, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1334,9 +1334,9 @@ TEST(SM50_device_plus_multiplies_ssrgemm_tt_t, 64x128x8_32x32x1_8x4_4x8_2x4) { using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< 
+ precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1370,9 +1370,9 @@ TEST(SM50_device_plus_multiplies_ssrgemm_tt_t, 64x256x8_32x64x1_8x8_4x8_2x4) { using WarpShape = cutlass::gemm::GemmShape<32, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1406,9 +1406,9 @@ TEST(SM50_device_plus_multiplies_ssrgemm_tt_t, 128x128x8_64x32x1_8x8_8x4_2x4) { using WarpShape = cutlass::gemm::GemmShape<64, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1442,9 +1442,9 @@ TEST(SM50_device_plus_multiplies_ssrgemm_tt_t, 32x32x8_8x16x1_2x2_4x8_4x2) { using WarpShape = cutlass::gemm::GemmShape<8, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, 
cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1478,9 +1478,9 @@ TEST(SM50_device_plus_multiplies_ssrgemm_tt_t, 64x32x8_16x16x1_4x2_4x8_4x2) { using WarpShape = cutlass::gemm::GemmShape<16, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1514,9 +1514,9 @@ TEST(SM50_device_plus_multiplies_ssrgemm_tt_t, 64x64x8_16x32x1_4x4_4x8_4x2) { using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1550,9 +1550,9 @@ TEST(SM50_device_plus_multiplies_ssrgemm_tt_t, 128x32x8_32x16x1_4x4_8x4_4x2) { using WarpShape = cutlass::gemm::GemmShape<32, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = 
Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1586,9 +1586,9 @@ TEST(SM50_device_plus_multiplies_ssrgemm_tt_t, 128x64x8_32x32x1_8x4_4x8_4x2) { using WarpShape = cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1622,9 +1622,9 @@ TEST(SM50_device_plus_multiplies_ssrgemm_tt_t, 128x128x8_32x64x1_8x8_4x8_4x2) { using WarpShape = cutlass::gemm::GemmShape<32, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1658,9 +1658,9 @@ TEST(SM50_device_plus_multiplies_ssrgemm_tt_t, 256x32x8_64x16x1_8x4_8x4_4x2) { using WarpShape = cutlass::gemm::GemmShape<64, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = 
Config::MultiplicationOp; @@ -1694,9 +1694,9 @@ TEST(SM50_device_plus_multiplies_ssrgemm_tt_t, 256x64x8_64x32x1_8x8_8x4_4x2) { using WarpShape = cutlass::gemm::GemmShape<64, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1730,9 +1730,9 @@ TEST(SM50_device_plus_multiplies_ssrgemm_tt_t, 32x64x16_8x16x1_2x2_4x8_4x4) { using WarpShape = cutlass::gemm::GemmShape<8, 16, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1766,9 +1766,9 @@ TEST(SM50_device_plus_multiplies_ssrgemm_tt_t, 32x128x16_8x32x1_2x4_4x8_4x4) { using WarpShape = cutlass::gemm::GemmShape<8, 32, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1802,9 +1802,9 @@ 
TEST(SM50_device_plus_multiplies_ssrgemm_tt_t, 64x32x16_16x8x1_2x2_8x4_4x4) { using WarpShape = cutlass::gemm::GemmShape<16, 8, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1838,9 +1838,9 @@ TEST(SM50_device_plus_multiplies_ssrgemm_tt_t, 64x64x8_16x16x1_4x2_4x8_4x4) { using WarpShape = cutlass::gemm::GemmShape<16, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1874,9 +1874,9 @@ TEST(SM50_device_plus_multiplies_ssrgemm_tt_t, 64x128x8_16x32x1_4x4_4x8_4x4) { using WarpShape = cutlass::gemm::GemmShape<16, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1910,9 +1910,9 @@ TEST(SM50_device_plus_multiplies_ssrgemm_tt_t, 
64x256x8_16x64x1_4x8_4x8_4x4) { using WarpShape = cutlass::gemm::GemmShape<16, 64, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1946,9 +1946,9 @@ TEST(SM50_device_plus_multiplies_ssrgemm_tt_t, 128x32x16_32x8x1_4x2_8x4_4x4) { using WarpShape = cutlass::gemm::GemmShape<32, 8, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -1982,9 +1982,9 @@ TEST(SM50_device_plus_multiplies_ssrgemm_tt_t, 128x64x8_32x16x1_4x4_8x4_4x4) { using WarpShape = cutlass::gemm::GemmShape<32, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -2018,9 +2018,9 @@ TEST(SM50_device_plus_multiplies_ssrgemm_tt_t, 128x128x8_32x32x1_8x4_4x8_4x4) { using WarpShape = 
cutlass::gemm::GemmShape<32, 32, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; @@ -2054,9 +2054,9 @@ TEST(SM50_device_plus_multiplies_ssrgemm_tt_t, 256x64x8_64x16x1_8x4_8x4_4x4) { using WarpShape = cutlass::gemm::GemmShape<64, 16, 8>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; - using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< // - precision, precision, precision, precision, OpClass, // - cuasr::plus, cuasr::multiplies, SmArch>; + using Config = typename cuasr::gemm::device::DefaultSemiRingConfiguration< + precision, precision, precision, precision, + cuasr::plus, cuasr::multiplies, OpClass, SmArch>; using AddOp = Config::AdditionOp; using MultOp = Config::MultiplicationOp; diff --git a/test/regress/src/cutlass_srgemm.cu b/test/regress/src/cutlass_srgemm.cu index 9a775c7..5b05007 100644 --- a/test/regress/src/cutlass_srgemm.cu +++ b/test/regress/src/cutlass_srgemm.cu @@ -29,8 +29,8 @@ auto cutlass_srsgemm_nn( using OperatorClass = cutlass::arch::OpClassSimt; using SmArch = cutlass::arch::Sm50; using TropicalConfig = typename cuasr::gemm::device::DefaultSemiRingConfiguration< - float, float, float, float, OperatorClass, cuasr::minimum, - cuasr::plus, SmArch>; + float, float, float, float, + cuasr::minimum, cuasr::plus, OperatorClass, SmArch>; using AdditionOp = TropicalConfig::AdditionOp; using MultiplicationOp = TropicalConfig::MultiplicationOp; From 4de2c56c643655ec2c6d89f379ae977b15639e55 Mon Sep 17 00:00:00 2001 From: Void Date: Wed, 3 Nov 2021 08:13:19 -0400 Subject: [PATCH 
09/15] Add initial Ampere multi-stage templates --- .../device/default_srgemm_configuration.h | 210 +++++ include/cuasr/gemm/kernel/default_srgemm.h | 107 ++- .../cuasr/gemm/threadblock/default_srmma.h | 80 ++ .../gemm/threadblock/default_srmma_core.h | 2 + .../threadblock/default_srmma_core_sm80.h | 721 ++++++++++++++++++ .../cuasr/gemm/threadblock/srmma_multistage.h | 607 +++++++++++++++ include/cuasr/gemm/warp/srmma_simt.h | 13 + 7 files changed, 1739 insertions(+), 1 deletion(-) create mode 100644 include/cuasr/gemm/threadblock/default_srmma_core_sm80.h create mode 100644 include/cuasr/gemm/threadblock/srmma_multistage.h diff --git a/include/cuasr/gemm/device/default_srgemm_configuration.h b/include/cuasr/gemm/device/default_srgemm_configuration.h index 9237353..73665e1 100644 --- a/include/cuasr/gemm/device/default_srgemm_configuration.h +++ b/include/cuasr/gemm/device/default_srgemm_configuration.h @@ -280,6 +280,216 @@ struct DefaultSemiRingConfiguration< /////////////////////////////////// SM 80 ////////////////////////////////////// //////////////////////////////////////////////////////////////////////////////// +// Plus-Times semi-ring GEMM configuration +// this is the traditional GEMM +template +struct DefaultSemiRingConfiguration< + Element, + Element, + Element, + Element, + cuasr::plus, + cuasr::multiplies, + cutlass::arch::OpClassSimt, + cutlass::arch::Sm80> { + + static int constexpr kAlignmentA = 1; + static int constexpr kAlignmentB = 1; + using ThreadblockShape = cutlass::gemm::GemmShape<64, 128, 8>; + using WarpShape = cutlass::gemm::GemmShape<32, 64, 8>; + using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; + static int constexpr kStages = 3; + + using AdditionOp = cuasr::plus; + using MultiplicationOp = cuasr::multiplies; + + using EpilogueOutputOp = cuasr::epilogue::thread::SemiringLinearCombination< + AdditionOp, MultiplicationOp, Element, 1>; +}; + +// Min-Plus (tropical) semi-ring GEMM configuration +// example application: All 
Pairs Shortest Path +template +struct DefaultSemiRingConfiguration< + Element, + Element, + Element, + Element, + cuasr::minimum, + cuasr::plus, + cutlass::arch::OpClassSimt, + cutlass::arch::Sm80> { + + static int constexpr kAlignmentA = 1; + static int constexpr kAlignmentB = 1; + using ThreadblockShape = cutlass::gemm::GemmShape<128, 128, 8>; + using WarpShape = cutlass::gemm::GemmShape<64, 32, 8>; + using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; + static int constexpr kStages = 3; + + using AdditionOp = cuasr::minimum; + using MultiplicationOp = cuasr::plus; + + using EpilogueOutputOp = cuasr::epilogue::thread::SemiringLinearCombination< + AdditionOp, MultiplicationOp, Element, 1>; +}; + +// Max-Plus semi-ring GEMM configuration +// example application: Viterbi algorithm +template +struct DefaultSemiRingConfiguration< + Element, + Element, + Element, + Element, + cuasr::maximum, + cuasr::plus, + cutlass::arch::OpClassSimt, + cutlass::arch::Sm80> { + + static int constexpr kAlignmentA = 1; + static int constexpr kAlignmentB = 1; + using ThreadblockShape = cutlass::gemm::GemmShape<64, 128, 8>; + using WarpShape = cutlass::gemm::GemmShape<16, 64, 8>; + using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; + static int constexpr kStages = 3; + + using AdditionOp = cuasr::maximum; + using MultiplicationOp = cuasr::plus; + + using EpilogueOutputOp = cuasr::epilogue::thread::SemiringLinearCombination< + AdditionOp, MultiplicationOp, Element, 1>; +}; + +// Max-Min +template +struct DefaultSemiRingConfiguration< + Element, + Element, + Element, + Element, + cuasr::maximum, + cuasr::minimum, + cutlass::arch::OpClassSimt, + cutlass::arch::Sm80> { + + static int constexpr kAlignmentA = 1; + static int constexpr kAlignmentB = 1; + using ThreadblockShape = cutlass::gemm::GemmShape<64, 128, 8>; + using WarpShape = cutlass::gemm::GemmShape<16, 64, 8>; + using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; + static int constexpr kStages = 3; + + using
AdditionOp = cuasr::maximum; + using MultiplicationOp = cuasr::minimum; + + using EpilogueOutputOp = cuasr::epilogue::thread::SemiringLinearCombination< + AdditionOp, MultiplicationOp, Element, 1>; +}; + +// Min-Max +template +struct DefaultSemiRingConfiguration< + Element, + Element, + Element, + Element, + cuasr::minimum, + cuasr::maximum, + cutlass::arch::OpClassSimt, + cutlass::arch::Sm80> { + + static int constexpr kAlignmentA = 1; + static int constexpr kAlignmentB = 1; + using ThreadblockShape = cutlass::gemm::GemmShape<64, 128, 8>; + using WarpShape = cutlass::gemm::GemmShape<16, 64, 8>; + using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; + static int constexpr kStages = 3; + + using AdditionOp = cuasr::minimum; + using MultiplicationOp = cuasr::maximum; + + using EpilogueOutputOp = cuasr::epilogue::thread::SemiringLinearCombination< + AdditionOp, MultiplicationOp, Element, 1>; +}; + +// Min-Times +template +struct DefaultSemiRingConfiguration< + Element, + Element, + Element, + Element, + cuasr::minimum, + cuasr::multiplies, + cutlass::arch::OpClassSimt, + cutlass::arch::Sm80> { + + static int constexpr kAlignmentA = 1; + static int constexpr kAlignmentB = 1; + using ThreadblockShape = cutlass::gemm::GemmShape<64, 128, 8>; + using WarpShape = cutlass::gemm::GemmShape<16, 64, 8>; + using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; + static int constexpr kStages = 3; + + using AdditionOp = cuasr::minimum; + using MultiplicationOp = cuasr::multiplies; + + using EpilogueOutputOp = cuasr::epilogue::thread::SemiringLinearCombination< + AdditionOp, MultiplicationOp, Element, 1>; +}; + +// Max-Times +template +struct DefaultSemiRingConfiguration< + Element, + Element, + Element, + Element, + cuasr::maximum, + cuasr::multiplies, + cutlass::arch::OpClassSimt, + cutlass::arch::Sm80> { + + static int constexpr kAlignmentA = 1; + static int constexpr kAlignmentB = 1; + using ThreadblockShape = cutlass::gemm::GemmShape<64, 128, 8>; + using WarpShape 
= cutlass::gemm::GemmShape<16, 64, 8>; + using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; + static int constexpr kStages = 3; + + using AdditionOp = cuasr::maximum; + using MultiplicationOp = cuasr::multiplies; + + using EpilogueOutputOp = cuasr::epilogue::thread::SemiringLinearCombination< + AdditionOp, MultiplicationOp, Element, 1>; +}; + +// Or-And boolean ring +template +struct DefaultSemiRingConfiguration< + Element, + Element, + Element, + Element, + cuasr::binary_or, + cuasr::binary_and, + cutlass::arch::OpClassSimt, + cutlass::arch::Sm80> { + + static int constexpr kAlignmentA = 1; + static int constexpr kAlignmentB = 1; + using ThreadblockShape = cutlass::gemm::GemmShape<64, 128, 8>; + using WarpShape = cutlass::gemm::GemmShape<16, 64, 8>; + using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; + static int constexpr kStages = 3; + + using AdditionOp = cuasr::binary_or; + using MultiplicationOp = cuasr::binary_and; + + using EpilogueOutputOp = cuasr::epilogue::thread::SemiringLinearCombination< + AdditionOp, MultiplicationOp, Element, 1>; +}; } // namespace device } // namespace gemm diff --git a/include/cuasr/gemm/kernel/default_srgemm.h b/include/cuasr/gemm/kernel/default_srgemm.h index 561b653..b85d2d9 100644 --- a/include/cuasr/gemm/kernel/default_srgemm.h +++ b/include/cuasr/gemm/kernel/default_srgemm.h @@ -79,9 +79,15 @@ template < int Stages, /// If true, kernel is configured to support serial reduction in the /// epilogue - bool SplitKSerial> + bool SplitKSerial, + /// Use zfill or predicate for out-of-bound cp.async + cutlass::gemm::SharedMemoryClearOption SharedMemoryClear + = cutlass::gemm::SharedMemoryClearOption::kNone> struct DefaultSrgemm; +//////////////////////////////////////////////////////////////////////////////// + +// SM50 SIMT Two Stage template < /// Element type for A matrix operand typename ElementA, @@ -180,6 +186,105 @@ struct DefaultSrgemm< 
//////////////////////////////////////////////////////////////////////////////// +// SM80 SIMT Multi Stage +template < + /// Element type for A matrix operand + typename ElementA, + /// Layout type for A matrix operand + typename LayoutA, + /// Access granularity of A matrix in units of elements + int kAlignmentA, + /// Element type for B matrix operand + typename ElementB, + /// Layout type for B matrix operand + typename LayoutB, + /// Access granularity of B matrix in units of elements + int kAlignmentB, + /// Element type for C and D matrix operands + typename ElementC, + /// Element type for internal accumulation + typename ElementAccumulator, + /// Threadblock-level tile size (concept: GemmShape) + typename ThreadblockShape, + /// Warp-level tile size (concept: GemmShape) + typename WarpShape, + /// Addition operator of the semi-ring + typename AdditionOp, + /// Multiplication operator of the semi-ring + typename MultiplicationOp, + /// Epilogue output operator + typename EpilogueOutputOp, + /// Threadblock-level swizzling operator + typename ThreadblockSwizzle, + /// Number of stages used in the pipelined mainloop + int Stages, + /// If true, kernel is configured to support serial reduction in the epilogue + bool SplitKSerial +> +struct DefaultSrgemm< + ElementA, + LayoutA, + kAlignmentA, + ElementB, + LayoutB, + kAlignmentB, + ElementC, + cutlass::layout::RowMajor, + ElementAccumulator, + cutlass::arch::OpClassSimt, + cutlass::arch::Sm80, + ThreadblockShape, + WarpShape, + cutlass::gemm::GemmShape<1, 1, 1>, + AdditionOp, + MultiplicationOp, + EpilogueOutputOp, + ThreadblockSwizzle, + Stages, + SplitKSerial> { + /// Define the threadblock-scoped matrix multiply-accumulate + using Srmma = typename cuasr::gemm::threadblock::DefaultSrmma< + ElementA, + LayoutA, + kAlignmentA, + ElementB, + LayoutB, + kAlignmentB, + ElementAccumulator, + cutlass::layout::RowMajor, + cutlass::arch::OpClassSimt, + cutlass::arch::Sm80, + ThreadblockShape, + WarpShape, + 
cutlass::gemm::GemmShape<1, 1, 1>, + AdditionOp, + MultiplicationOp, + Stages>::ThreadblockSrmma; + + static int const kEpilogueElementsPerAccess = EpilogueOutputOp::kCount; + static_assert(kEpilogueElementsPerAccess == 1, "simt epilogue must operate on scalars"); + + /// Define the epilogue + using Epilogue = typename cutlass::epilogue::threadblock::DefaultEpilogueSimt< + ThreadblockShape, + typename Srmma::Operator, + EpilogueOutputOp, + kEpilogueElementsPerAccess + >::Epilogue; + + /// Define the kernel-level GEMM operator. + using SrgemmKernel = cuasr::gemm::kernel::Srgemm< + Srmma, + AdditionOp, + MultiplicationOp, + Epilogue, + ThreadblockSwizzle, + SplitKSerial + >; +}; + +//////////////////////////////////////////////////////////////////////////////// + } // namespace kernel } // namespace gemm } // namespace cuasr diff --git a/include/cuasr/gemm/threadblock/default_srmma.h b/include/cuasr/gemm/threadblock/default_srmma.h index 2435e65..147a1b0 100644 --- a/include/cuasr/gemm/threadblock/default_srmma.h +++ b/include/cuasr/gemm/threadblock/default_srmma.h @@ -124,6 +124,86 @@ struct DefaultSrmma; }; +//////////////////////////////////////////////////////////////////////////////// + +/// Specialization for row-major output multi-stage (OperatorClass Simt) +template < + /// Element type for A matrix operand + typename ElementA, + /// Layout type for A matrix operand + typename LayoutA, + /// Access granularity of A matrix in units of elements + int kAlignmentA, + /// Element type for B matrix operand + typename ElementB, + /// Layout type for B matrix operand + typename LayoutB, + /// Access granularity of B matrix in units of elements + int kAlignmentB, + /// Element type for internal accumulation + typename ElementAccumulator, + /// Tag indicating architecture to tune for + typename ArchTag, + /// Threadblock-level tile size (concept: GemmShape) + typename ThreadblockShape, + /// Warp-level tile size (concept: GemmShape) + typename WarpShape, + /// 
Instruction-level tile size (concept: GemmShape) + typename InstructionShape, + /// Number of stages used in the multistage mainloop + int Stages, + /// Addition operator of the semi-ring + typename AdditionOp, + /// Multiplication operator of the semi-ring + typename MultiplicationOp> +struct DefaultSrmma { + + static cutlass::arch::CacheOperation::Kind const CacheOpA = + ((cutlass::sizeof_bits::value * kAlignmentA) == 128) + ? cutlass::arch::CacheOperation::Global + : cutlass::arch::CacheOperation::Always; + + static cutlass::arch::CacheOperation::Kind const CacheOpB = + ((cutlass::sizeof_bits::value * kAlignmentB) == 128) + ? cutlass::arch::CacheOperation::Global + : cutlass::arch::CacheOperation::Always; + + // Define the SrmmaCore components + using SrmmaCore = typename cuasr::gemm::threadblock::DefaultSrmmaCore< + ThreadblockShape, WarpShape, InstructionShape, ElementA, LayoutA, + ElementB, LayoutB, ElementAccumulator, cutlass::layout::RowMajor, + cutlass::arch::OpClassSimt, AdditionOp, MultiplicationOp, Stages, CacheOpA, CacheOpB>; + + // Define iterators over tiles from the A operand + using ThreadMapA = typename SrmmaCore::IteratorThreadMapA; + using AccessTypeA = cutlass::Array; + using IteratorA = + cutlass::transform::threadblock::PredicatedTileAccessIterator< + cutlass::MatrixShape, + ElementA, LayoutA, 1, ThreadMapA, AccessTypeA>; + + // Define iterators over tiles from the B operand + using ThreadMapB = typename SrmmaCore::IteratorThreadMapB; + using AccessTypeB = cutlass::Array; + using IteratorB = + cutlass::transform::threadblock::PredicatedTileAccessIterator< + cutlass::MatrixShape, + ElementB, LayoutB, 0, ThreadMapB, AccessTypeB>; + + // Define the threadblock-scoped pipelined matrix multiply + using ThreadblockSrmma = cuasr::gemm::threadblock::SrmmaMultistage< + typename SrmmaCore::Shape, IteratorA, typename SrmmaCore::SmemIteratorA, + SrmmaCore::kCacheOpA, IteratorB, typename SrmmaCore::SmemIteratorB, + SrmmaCore::kCacheOpB, 
ElementAccumulator, cutlass::layout::RowMajor, + typename SrmmaCore::MmaPolicy, Stages>; +}; + +//////////////////////////////////////////////////////////////////////////////// } // namespace threadblock } // namespace gemm diff --git a/include/cuasr/gemm/threadblock/default_srmma_core.h b/include/cuasr/gemm/threadblock/default_srmma_core.h index 3f69212..4a76c10 100644 --- a/include/cuasr/gemm/threadblock/default_srmma_core.h +++ b/include/cuasr/gemm/threadblock/default_srmma_core.h @@ -20,6 +20,7 @@ #include "cutlass/gemm/warp/mma.h" #include "cuasr/gemm/threadblock/srmma_pipelined.h" +#include "cuasr/gemm/threadblock/srmma_multistage.h" ///////////////////////////////////////////////////////////////////////////////////////////////// @@ -82,3 +83,4 @@ struct DefaultSrmmaCore; } // namespace cuasr #include "cuasr/gemm/threadblock/default_srmma_core_simt.h" +#include "cuasr/gemm/threadblock/default_srmma_core_sm80.h" diff --git a/include/cuasr/gemm/threadblock/default_srmma_core_sm80.h b/include/cuasr/gemm/threadblock/default_srmma_core_sm80.h new file mode 100644 index 0000000..c8c2d72 --- /dev/null +++ b/include/cuasr/gemm/threadblock/default_srmma_core_sm80.h @@ -0,0 +1,721 @@ +/*************************************************************************************************** + * Copyright (c) 2021, Vijay Thakkar. + * Copyright (c) 2017-2021, NVIDIA CORPORATION. All rights reserved. + * + * Redistribution and use in source and binary forms, with or without modification, are permitted + * provided that the following conditions are met: + * * Redistributions of source code must retain the above copyright notice, this list of + * conditions and the following disclaimer. + * * Redistributions in binary form must reproduce the above copyright notice, this list of + * conditions and the following disclaimer in the documentation and/or other materials + * provided with the distribution. 
+ * * Neither the name of the NVIDIA CORPORATION nor the names of its contributors may be used + * to endorse or promote products derived from this software without specific prior written + * permission. + * + * THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT HOLDERS AND CONTRIBUTORS "AS IS" AND ANY EXPRESS OR + * IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE IMPLIED WARRANTIES OF MERCHANTABILITY AND + * FITNESS FOR A PARTICULAR PURPOSE ARE DISCLAIMED. IN NO EVENT SHALL NVIDIA CORPORATION BE LIABLE + * FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR CONSEQUENTIAL DAMAGES (INCLUDING, + * BUT NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS OR SERVICES; LOSS OF USE, DATA, OR PROFITS; + * OR BUSINESS INTERRUPTION) HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN CONTRACT, + * STRICT LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE + * OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE. + * + **************************************************************************************************/ + +/*! \file + \brief Defines basic properties needed by CTA-level GEMMs assuming + expectations about data layout of the global memory fragments, data types, + and internal tile sizes. + + Partial specializations for threadblock::Mma operations targeting SIMT + instructions. 
+*/ + +#pragma once + +#include "cutlass/array.h" +#include "cutlass/cutlass.h" + +#include "cutlass/gemm/warp/mma_simt_policy.h" +#include "cutlass/gemm/warp/mma_simt.h" + + +#include "cutlass/matrix_shape.h" +#include "cutlass/numeric_types.h" +#include "cutlass/transform/pitch_linear_thread_map.h" +#include "cutlass/transform/threadblock/regular_tile_access_iterator_tensor_op.h" +#include "cutlass/transform/threadblock/regular_tile_access_iterator_tensor_op_sm80.h" +#include "cutlass/transform/threadblock/regular_tile_access_iterator_pitch_linear.h" + +#include "cuasr/gemm/threadblock/default_srmma_core.h" + +//////////////////////////////////////////////////////////////////////////////// + +namespace cuasr { +namespace gemm { +namespace threadblock { + +//////////////////////////////////////////////////////////////////////////////// + +/// Partial specialization for SIMT GEMMs using multistage pipeline. +/// +/// +/// This uses the default warp-level operator given tile sizes +template < + /// Shape of threadblock-scoped matrix multiply operator (concept: + /// GemmShape) + typename Shape_, + /// Shape of warp-level matrix multiply operator (concept: GemmShape) + typename WarpShape_, + /// Shape of one matrix production operation (concept: GemmShape) + typename InstructionShape_, + /// Data type of A operand + typename ElementA_, + /// Data type of B operand + typename ElementB_, + /// Data type of accumulator + typename ElementC_, + /// Layout of accumulator + typename LayoutC_, + /// Addition operator of the semi-ring + typename AdditionOp_, + /// Multiplication operator of the semi-ring + typename MultiplicationOp_, + /// Number of stages + int Stages, + /// Cache operation of operand A + cutlass::arch::CacheOperation::Kind CacheOpA, + /// Cache operation of operand B + cutlass::arch::CacheOperation::Kind CacheOpB> +struct DefaultSrmmaCore { + using Shape = Shape_; + using WarpShape = WarpShape_; + using InstructionShape = InstructionShape_; + using ElementA 
= ElementA_; + using LayoutA = cutlass::layout::ColumnMajor; + using ElementB = ElementB_; + using LayoutB = cutlass::layout::ColumnMajor; + using ElementC = ElementC_; + using LayoutC = LayoutC_; + using AdditionOp = AdditionOp_; + using MultiplicationOp = MultiplicationOp_; + static int const kStages = Stages; + static cutlass::arch::CacheOperation::Kind const kCacheOpA = cutlass::arch::CacheOperation::Always; + static cutlass::arch::CacheOperation::Kind const kCacheOpB = cutlass::arch::CacheOperation::Always; + + /// Number of warps present + using WarpCount = cutlass::gemm::GemmShape; + + // Divisibility requirements + static_assert( + !(Shape::kM % WarpShape::kM) && !(Shape::kN % WarpShape::kN), + "Threadblock-scoped GEMM should be divisible by warp-scoped GEMM size."); + + /// Number of threads per warp + static int const kWarpSize = cutlass::gemm::warp::WarpSize::value; + + /// Number of threads total + static int const kThreads = WarpCount::kCount * kWarpSize; + + // Warp thread arrangement + static int const kElementsPerAccess = 1; + + // + // Shared memory layouts + // + + using SmemLayoutA = cutlass::layout::ColumnMajor; + + // Shared memory layout + using SmemLayoutB = cutlass::layout::RowMajor; + + // + // Iterators to write to shared memory + // + + + /// ThreadMap of iterator A + using IteratorThreadMapA = cutlass::transform::PitchLinearStripminedThreadMap< + cutlass::layout::PitchLinearShape, + kThreads, + kElementsPerAccess + >; + + /// Shared memory iterator to A operand + using SmemIteratorA = cutlass::transform::threadblock::RegularTileAccessIterator< + cutlass::MatrixShape, ElementA, SmemLayoutA, 0, + IteratorThreadMapA>; + + /// Policy of iterator B + using IteratorThreadMapB = cutlass::transform::PitchLinearStripminedThreadMap< + cutlass::layout::PitchLinearShape, + kThreads, + kElementsPerAccess + >; + + /// Transpose the ThreadMap of iterator B + using SmemThreadMapB = cutlass::transform::TransposePitchLinearThreadMapSimt; + + /// Shared 
memory iterator to B operand + using SmemIteratorB = cutlass::transform::threadblock::RegularTileAccessIterator< + cutlass::MatrixShape, ElementB, SmemLayoutB, 1, + SmemThreadMapB>; + + // + // Warp-level matrix multiply operator + // + + // Define the warp-level op + static const int WarpNumThreadsM = 4; // TODO need to extract these from template data + static const int WarpNumThreadsN = 8; + static_assert(!(WarpShape::kM % WarpNumThreadsM) && !(WarpShape::kN % WarpNumThreadsN), + "WarpShape must be divisible by ThreadTile shape."); + static const int ThreadTileM = WarpShape::kM / WarpNumThreadsM; + static const int ThreadTileN = WarpShape::kN / WarpNumThreadsN; + static const int LaneLayout = ThreadTileM > 4 && ThreadTileN > 4 ? 2 : 1; + static const int numElementsA = 128 / cutlass::sizeof_bits::value; + static const int numElementsB = 128 / cutlass::sizeof_bits::value; + static const int LaneM = cutlass::const_min(numElementsA, ThreadTileM); + static const int LaneN = cutlass::const_min(numElementsB, ThreadTileN); + + static_assert(!((Shape::kK / 32) % LaneN), + "Padding must be divisible by Lane"); + + // these should have max of thread tile also + using LaneMmaShape = cutlass::gemm::GemmShape< + LaneM, + LaneN, + 1>; + + using Policy = cutlass::gemm::warp::MmaSimtPolicy< + cutlass::MatrixShape, // WarpShape + cutlass::layout::RowMajorInterleaved, // LaneLayout + LaneMmaShape + >; + + using MmaWarpSimt = cuasr::gemm::warp::SrmmaSimt< + WarpShape, /// Size of the Gemm problem - concept: gemm::GemmShape<> 128, 128, 8 + ElementA, /// Data type of A elements + SmemLayoutA, /// Layout of A matrix (concept: MatrixLayout) + ElementB, /// Data type of B elements + SmemLayoutB, /// Layout of B matrix (concept: MatrixLayout) + ElementC, /// Element type of C matrix + LayoutC, /// Layout of C matrix (concept: MatrixLayout) + Policy, /// Policy describing warp-level MmaSimtOp (concept: MmaSimtOp policy) + AdditionOp, /// Addition operator of the semi-ring + 
MultiplicationOp /// Multiplication operator of the semi-ring + >; + + /// Policy used to define MmaPipelined + using MmaPolicy = cutlass::gemm::threadblock::MmaPolicy< + MmaWarpSimt, + cutlass::MatrixShape<0, 0>, + cutlass::MatrixShape<0, Shape::kK / 32>, + WarpCount::kK + >; +}; + +/// Partial specialization for SIMT GEMMs using multistage pipeline. +/// +/// +/// This uses the default warp-level operator given tile sizes +template < + /// Shape of threadblock-scoped matrix multiply operator (concept: + /// GemmShape) + typename Shape_, + /// Shape of warp-level matrix multiply operator (concept: GemmShape) + typename WarpShape_, + /// Shape of one matrix production operation (concept: GemmShape) + typename InstructionShape_, + /// Data type of A operand + typename ElementA_, + /// Data type of B operand + typename ElementB_, + /// Data type of accumulator + typename ElementC_, + /// Layout of accumulator + typename LayoutC_, + /// Addition operator of the semi-ring + typename AdditionOp_, + /// Multiplication operator of the semi-ring + typename MultiplicationOp_, + /// Number of stages + int Stages, + /// Cache operation of operand A + cutlass::arch::CacheOperation::Kind CacheOpA, + /// Cache operation of operand B + cutlass::arch::CacheOperation::Kind CacheOpB> +struct DefaultSrmmaCore { + using Shape = Shape_; + using WarpShape = WarpShape_; + using InstructionShape = InstructionShape_; + using ElementA = ElementA_; + using LayoutA = cutlass::layout::ColumnMajor; + using ElementB = ElementB_; + using LayoutB = cutlass::layout::RowMajor; + using ElementC = ElementC_; + using LayoutC = LayoutC_; + using AdditionOp = AdditionOp_; + using MultiplicationOp = MultiplicationOp_; + static int const kStages = Stages; + static cutlass::arch::CacheOperation::Kind const kCacheOpA = cutlass::arch::CacheOperation::Always; + static cutlass::arch::CacheOperation::Kind const kCacheOpB = cutlass::arch::CacheOperation::Always; + + /// Number of warps present + using WarpCount = 
cutlass::gemm::GemmShape; + + // Divisibility requirements + static_assert( + !(Shape::kM % WarpShape::kM) && !(Shape::kN % WarpShape::kN), + "Threadblock-scoped GEMM should be divisible by warp-scoped GEMM size."); + + /// Number of threads per warp + static int const kWarpSize = cutlass::gemm::warp::WarpSize::value; + + /// Number of threads total + static int const kThreads = WarpCount::kCount * kWarpSize; + + // Warp thread arrangement + static int const kElementsPerAccess = 1; + + // + // Shared memory layouts + // + + using SmemLayoutA = cutlass::layout::ColumnMajor; + + // Shared memory layout + using SmemLayoutB = cutlass::layout::RowMajor; + + // + // Iterators to write to shared memory + // + + + /// ThreadMap of iterator A + using IteratorThreadMapA = cutlass::transform::PitchLinearStripminedThreadMap< + cutlass::layout::PitchLinearShape, + kThreads, + kElementsPerAccess + >; + + /// Shared memory iterator to A operand + using SmemIteratorA = cutlass::transform::threadblock::RegularTileAccessIterator< + cutlass::MatrixShape, ElementA, SmemLayoutA, 0, + IteratorThreadMapA>; + + /// Policy of iterator B + using IteratorThreadMapB = cutlass::transform::PitchLinearStripminedThreadMap< + cutlass::layout::PitchLinearShape, + kThreads, + kElementsPerAccess + >; + + /// Shared memory iterator to B operand + using SmemIteratorB = cutlass::transform::threadblock::RegularTileAccessIterator< + cutlass::MatrixShape, ElementB, SmemLayoutB, 1, + IteratorThreadMapB>; + + // + // Warp-level matrix multiply operator + // + + // Define the warp-level op + static const int WarpNumThreadsM = 4; // TODO need to extract these from template data + static const int WarpNumThreadsN = 8; + static_assert(!(WarpShape::kM % WarpNumThreadsM) && !(WarpShape::kN % WarpNumThreadsN), + "WarpShape must be divisible by ThreadTile shape."); + static const int ThreadTileM = WarpShape::kM / WarpNumThreadsM; + static const int ThreadTileN = WarpShape::kN / WarpNumThreadsN; + static const int 
LaneLayout = ThreadTileM > 4 && ThreadTileN > 4 ? 2 : 1; + static const int numElementsA = 128 / cutlass::sizeof_bits::value; + static const int numElementsB = 128 / cutlass::sizeof_bits::value; + static const int LaneM = cutlass::const_min(numElementsA, ThreadTileM); + static const int LaneN = cutlass::const_min(numElementsB, ThreadTileN); + + // these should have max of thread tile also + using LaneMmaShape = cutlass::gemm::GemmShape< + LaneM, + LaneN, + 1>; + + using Policy = cutlass::gemm::warp::MmaSimtPolicy< + cutlass::MatrixShape, // WarpShape + cutlass::layout::RowMajorInterleaved, // LaneLayout + LaneMmaShape + >; + + using MmaWarpSimt = cuasr::gemm::warp::SrmmaSimt< + WarpShape, /// Size of the Gemm problem - concept: gemm::GemmShape<> 128, 128, 8 + ElementA, /// Data type of A elements + SmemLayoutA, /// Layout of A matrix (concept: MatrixLayout) + ElementB, /// Data type of B elements + SmemLayoutB, /// Layout of B matrix (concept: MatrixLayout) + ElementC, /// Element type of C matrix + LayoutC, /// Layout of C matrix (concept: MatrixLayout) + Policy, /// Policy describing warp-level MmaSimtOp (concept: MmaSimtOp policy) + AdditionOp, /// Addition operator of the semi-ring + MultiplicationOp /// Multiplication operator of the semi-ring + >; + + /// Policy used to define MmaPipelined + using MmaPolicy = cutlass::gemm::threadblock::MmaPolicy< + MmaWarpSimt, + cutlass::MatrixShape<0, 0>, + cutlass::MatrixShape<0, 0>, + WarpCount::kK + >; +}; + +/// Partial specialization for SIMT GEMMs using multistage pipeline. 
+/// +/// +/// This uses the default warp-level operator given tile sizes +template < + /// Shape of threadblock-scoped matrix multiply operator (concept: + /// GemmShape) + typename Shape_, + /// Shape of warp-level matrix multiply operator (concept: GemmShape) + typename WarpShape_, + /// Shape of one matrix production operation (concept: GemmShape) + typename InstructionShape_, + /// Data type of A operand + typename ElementA_, + /// Data type of B operand + typename ElementB_, + /// Data type of accumulator + typename ElementC_, + /// Layout of accumulator + typename LayoutC_, + /// Addition operator of the semi-ring + typename AdditionOp_, + /// Multiplication operator of the semi-ring + typename MultiplicationOp_, + /// Number of stages + int Stages, + /// Cache operation of operand A + cutlass::arch::CacheOperation::Kind CacheOpA, + /// Cache operation of operand B + cutlass::arch::CacheOperation::Kind CacheOpB> +struct DefaultSrmmaCore { + using Shape = Shape_; + using WarpShape = WarpShape_; + using InstructionShape = InstructionShape_; + using ElementA = ElementA_; + using LayoutA = cutlass::layout::RowMajor; + using ElementB = ElementB_; + using LayoutB = cutlass::layout::ColumnMajor; + using ElementC = ElementC_; + using LayoutC = LayoutC_; + using AdditionOp = AdditionOp_; + using MultiplicationOp = MultiplicationOp_; + static int const kStages = Stages; + static cutlass::arch::CacheOperation::Kind const kCacheOpA = cutlass::arch::CacheOperation::Always; + static cutlass::arch::CacheOperation::Kind const kCacheOpB = cutlass::arch::CacheOperation::Always; + + /// Number of warps present + using WarpCount = cutlass::gemm::GemmShape; + + // Divisibility requirements + static_assert( + !(Shape::kM % WarpShape::kM) && !(Shape::kN % WarpShape::kN), + "Threadblock-scoped GEMM should be divisible by warp-scoped GEMM size."); + + /// Number of threads per warp + static int const kWarpSize = cutlass::gemm::warp::WarpSize::value; + + /// Number of threads total + 
static int const kThreads = WarpCount::kCount * kWarpSize; + + // Warp thread arrangement + static int const kElementsPerAccess = 1; + + // + // Shared memory layouts + // + + using SmemLayoutA = cutlass::layout::ColumnMajor; + + // Shared memory layout + using SmemLayoutB = cutlass::layout::RowMajor; + + // + // Iterators to write to shared memory + // + + + /// ThreadMap of iterator A + using IteratorThreadMapA = cutlass::transform::PitchLinearStripminedThreadMap< + cutlass::layout::PitchLinearShape, + kThreads, + kElementsPerAccess + >; + + /// Transpose the ThreadMap of iterator A + using SmemThreadMapA = cutlass::transform::TransposePitchLinearThreadMapSimt; + + /// Shared memory iterator to A operand + using SmemIteratorA = cutlass::transform::threadblock::RegularTileAccessIterator< + cutlass::MatrixShape, ElementA, SmemLayoutA, 0, + SmemThreadMapA>; + + /// Policy of iterator B + using IteratorThreadMapB = cutlass::transform::PitchLinearStripminedThreadMap< + cutlass::layout::PitchLinearShape, + kThreads, + kElementsPerAccess + >; + + /// Transpose the ThreadMap of iterator B + using SmemThreadMapB = cutlass::transform::TransposePitchLinearThreadMapSimt; + + /// Shared memory iterator to B operand + using SmemIteratorB = cutlass::transform::threadblock::RegularTileAccessIterator< + cutlass::MatrixShape, ElementB, SmemLayoutB, 1, + SmemThreadMapB>; + + // + // Warp-level matrix multiply operator + // + + // Define the warp-level op + static const int WarpNumThreadsM = 4; // TODO need to extract these from template data + static const int WarpNumThreadsN = 8; + static_assert(!(WarpShape::kM % WarpNumThreadsM) && !(WarpShape::kN % WarpNumThreadsN), + "WarpShape must be divisible by ThreadTile shape."); + static const int ThreadTileM = WarpShape::kM / WarpNumThreadsM; + static const int ThreadTileN = WarpShape::kN / WarpNumThreadsN; + static const int LaneLayout = ThreadTileM > 4 && ThreadTileN > 4 ? 
2 : 1; + static const int numElementsA = 128 / cutlass::sizeof_bits::value; + static const int numElementsB = 128 / cutlass::sizeof_bits::value; + static const int LaneM = cutlass::const_min(numElementsA, ThreadTileM); + static const int LaneN = cutlass::const_min(numElementsB, ThreadTileN); + + static_assert(!((Shape::kK / 32) % LaneM) && !((Shape::kK / 32) % LaneN), + "Padding must be divisible by Lane"); + + // these should have max of thread tile also + using LaneMmaShape = cutlass::gemm::GemmShape< + LaneM, + LaneN, + 1>; + + using Policy = cutlass::gemm::warp::MmaSimtPolicy< + cutlass::MatrixShape, // WarpShape + cutlass::layout::RowMajorInterleaved, // LaneLayout + LaneMmaShape + >; + + using MmaWarpSimt = cuasr::gemm::warp::SrmmaSimt< + WarpShape, /// Size of the Gemm problem - concept: gemm::GemmShape<> 128, 128, 8 + ElementA, /// Data type of A elements + SmemLayoutA, /// Layout of A matrix (concept: MatrixLayout) + ElementB, /// Data type of B elements + SmemLayoutB, /// Layout of B matrix (concept: MatrixLayout) + ElementC, /// Element type of C matrix + LayoutC, /// Layout of C matrix (concept: MatrixLayout) + Policy, /// Policy describing warp-level MmaSimtOp (concept: MmaSimtOp policy) + AdditionOp, /// Addition operator of the semi-ring + MultiplicationOp /// Multiplication operator of the semi-ring + >; + + /// Policy used to define MmaPipelined + using MmaPolicy = cutlass::gemm::threadblock::MmaPolicy< + MmaWarpSimt, + cutlass::MatrixShape, + cutlass::MatrixShape<0, Shape::kK / 32>, + WarpCount::kK + >; +}; + +/// Partial specialization for SIMT GEMMs using multistage pipeline. 
+/// +/// +/// This uses the default warp-level operator given tile sizes +template < + /// Shape of threadblock-scoped matrix multiply operator (concept: + /// GemmShape) + typename Shape_, + /// Shape of warp-level matrix multiply operator (concept: GemmShape) + typename WarpShape_, + /// Shape of one matrix production operation (concept: GemmShape) + typename InstructionShape_, + /// Data type of A operand + typename ElementA_, + /// Data type of B operand + typename ElementB_, + /// Data type of accumulator + typename ElementC_, + /// Layout of accumulator + typename LayoutC_, + /// Addition operator of the semi-ring + typename AdditionOp_, + /// Multiplication operator of the semi-ring + typename MultiplicationOp_, + /// Number of stages + int Stages, + /// Cache operation of operand A + cutlass::arch::CacheOperation::Kind CacheOpA, + /// Cache operation of operand B + cutlass::arch::CacheOperation::Kind CacheOpB> +struct DefaultSrmmaCore { + using Shape = Shape_; + using WarpShape = WarpShape_; + using InstructionShape = InstructionShape_; + using ElementA = ElementA_; + using LayoutA = cutlass::layout::RowMajor; + using ElementB = ElementB_; + using LayoutB = cutlass::layout::RowMajor; + using ElementC = ElementC_; + using LayoutC = LayoutC_; + using AdditionOp = AdditionOp_; + using MultiplicationOp = MultiplicationOp_; + static int const kStages = Stages; + static cutlass::arch::CacheOperation::Kind const kCacheOpA = cutlass::arch::CacheOperation::Always; + static cutlass::arch::CacheOperation::Kind const kCacheOpB = cutlass::arch::CacheOperation::Always; + + /// Number of warps present + using WarpCount = cutlass::gemm::GemmShape; + + // Divisibility requirements + static_assert( + !(Shape::kM % WarpShape::kM) && !(Shape::kN % WarpShape::kN), + "Threadblock-scoped GEMM should be divisible by warp-scoped GEMM size."); + + /// Number of threads per warp + static int const kWarpSize = cutlass::gemm::warp::WarpSize::value; + + /// Number of threads total + 
static int const kThreads = WarpCount::kCount * kWarpSize; + + // Warp thread arrangement + static int const kElementsPerAccess = 1; + + // + // Shared memory layouts + // + + using SmemLayoutA = cutlass::layout::ColumnMajor; + + // Shared memory layout + using SmemLayoutB = cutlass::layout::RowMajor; + + // + // Iterators to write to shared memory + // + + /// ThreadMap of iterator A + using IteratorThreadMapA = cutlass::transform::PitchLinearStripminedThreadMap< + cutlass::layout::PitchLinearShape, + kThreads, + kElementsPerAccess + >; + + /// Transpose the ThreadMap of iterator A + using SmemThreadMapA = cutlass::transform::TransposePitchLinearThreadMapSimt; + + /// Shared memory iterator to A operand + using SmemIteratorA = cutlass::transform::threadblock::RegularTileAccessIterator< + cutlass::MatrixShape, ElementA, SmemLayoutA, 0, + SmemThreadMapA>; + + /// Policy of iterator B + using IteratorThreadMapB = cutlass::transform::PitchLinearStripminedThreadMap< + cutlass::layout::PitchLinearShape, + kThreads, + kElementsPerAccess + >; + + /// Shared memory iterator to B operand + using SmemIteratorB = cutlass::transform::threadblock::RegularTileAccessIterator< + cutlass::MatrixShape, ElementB, SmemLayoutB, 1, + IteratorThreadMapB>; + + // + // Warp-level matrix multiply operator + // + + // Define the warp-level op + static const int WarpNumThreadsM = 4; // TODO need to extract these from template data + static const int WarpNumThreadsN = 8; + static_assert(!(WarpShape::kM % WarpNumThreadsM) && !(WarpShape::kN % WarpNumThreadsN), + "WarpShape must be divisible by ThreadTile shape."); + static const int ThreadTileM = WarpShape::kM / WarpNumThreadsM; + static const int ThreadTileN = WarpShape::kN / WarpNumThreadsN; + static const int LaneLayout = ThreadTileM > 4 && ThreadTileN > 4 ? 
2 : 1; + static const int numElementsA = 128 / cutlass::sizeof_bits::value; + static const int numElementsB = 128 / cutlass::sizeof_bits::value; + static const int LaneM = cutlass::const_min(numElementsA, ThreadTileM); + static const int LaneN = cutlass::const_min(numElementsB, ThreadTileN); + + static_assert(!((Shape::kK / 32) % LaneM), + "Padding must be divisible by Lane"); + + // these should have max of thread tile also + using LaneMmaShape = cutlass::gemm::GemmShape< + LaneM, + LaneN, + 1>; + + using Policy = cutlass::gemm::warp::MmaSimtPolicy< + cutlass::MatrixShape, // WarpShape + cutlass::layout::RowMajorInterleaved, // LaneLayout + LaneMmaShape + >; + + using MmaWarpSimt = cuasr::gemm::warp::SrmmaSimt< + WarpShape, /// Size of the Gemm problem - concept: gemm::GemmShape<> 128, 128, 8 + ElementA, /// Data type of A elements + SmemLayoutA, /// Layout of A matrix (concept: MatrixLayout) + ElementB, /// Data type of B elements + SmemLayoutB, /// Layout of B matrix (concept: MatrixLayout) + ElementC, /// Element type of C matrix + LayoutC, /// Layout of C matrix (concept: MatrixLayout) + Policy, /// Policy describing warp-level MmaSimtOp (concept: MmaSimtOp policy) + AdditionOp, /// Addition operator of the semi-ring + MultiplicationOp /// Multiplication operator of the semi-ring + >; + + /// Policy used to define MmaPipelined + using MmaPolicy = cutlass::gemm::threadblock::MmaPolicy< + MmaWarpSimt, + cutlass::MatrixShape, + cutlass::MatrixShape<0, 0>, + WarpCount::kK + >; +}; + +//////////////////////////////////////////////////////////////////////////////// + +} // namespace threadblock +} // namespace gemm +} // namespace cuasr diff --git a/include/cuasr/gemm/threadblock/srmma_multistage.h b/include/cuasr/gemm/threadblock/srmma_multistage.h new file mode 100644 index 0000000..dfea1d5 --- /dev/null +++ b/include/cuasr/gemm/threadblock/srmma_multistage.h @@ -0,0 +1,607 @@ 
+/*************************************************************************************************** + * Copyright (c) 2021, Vijay Thakkar. + * Copyright (c) 2017-2021, NVIDIA CORPORATION. All rights reserved. + * + * Redistribution and use in source and binary forms, with or without modification, are permitted + * provided that the following conditions are met: + * * Redistributions of source code must retain the above copyright notice, this list of + * conditions and the following disclaimer. + * * Redistributions in binary form must reproduce the above copyright notice, this list of + * conditions and the following disclaimer in the documentation and/or other materials + * provided with the distribution. + * * Neither the name of the NVIDIA CORPORATION nor the names of its contributors may be used + * to endorse or promote products derived from this software without specific prior written + * permission. + * + * THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT HOLDERS AND CONTRIBUTORS "AS IS" AND ANY EXPRESS OR + * IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE IMPLIED WARRANTIES OF MERCHANTABILITY AND + * FITNESS FOR A PARTICULAR PURPOSE ARE DISCLAIMED. IN NO EVENT SHALL NVIDIA CORPORATION BE LIABLE + * FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR CONSEQUENTIAL DAMAGES (INCLUDING, + * BUT NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS OR SERVICES; LOSS OF USE, DATA, OR PROFITS; + * OR BUSINESS INTERRUPTION) HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN CONTRACT, + * STRICT LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE + * OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE. + * + **************************************************************************************************/ +/*! \file + \brief Template for a double-buffered threadblock-scoped GEMM kernel. 
+*/ + +#pragma once + +#include "cutlass/aligned_buffer.h" +#include "cutlass/arch/memory.h" +#include "cutlass/array.h" +#include "cutlass/cutlass.h" +#include "cutlass/gemm/gemm.h" +#include "cutlass/matrix_shape.h" +#include "cutlass/numeric_types.h" + +#include "cutlass/gemm/threadblock/mma_base.h" + +///////////////////////////////////////////////////////////////////////////////////////////////// + +namespace cuasr { +namespace gemm { +namespace threadblock { + +///////////////////////////////////////////////////////////////////////////////////////////////// + +/// Structure to compute the matrix product targeting CUDA cores and SIMT math +/// instructions. +template < + /// Size of the Gemm problem - concept: gemm::GemmShape<> + typename Shape_, + /// Iterates over tiles of A operand in global memory + // (concept: ReadableTileIterator | ForwardTileIterator | + // MaskedTileIterator) + typename IteratorA_, + /// Iterates over tiles of A operand in shared memory + /// (concept: WriteableTileIterator | RandomAccessTileIterator) + typename SmemIteratorA_, + /// Cache operation for operand A + cutlass::arch::CacheOperation::Kind CacheOpA, + /// Iterates over tiles of B operand in global memory + // (concept: ReadableTileIterator | ForwardTileIterator | + // MaskedTileIterator) + typename IteratorB_, + /// Iterates over tiles of B operand in shared memory + /// (concept: WriteableTileIterator | RandomAccessTileIterator) + typename SmemIteratorB_, + /// Cache operation for operand B + cutlass::arch::CacheOperation::Kind CacheOpB, + /// Data type of accumulator matrix + typename ElementC_, + /// Data type of accumulator matrix + typename LayoutC_, + /// Policy describing tuning details (concept: MmaPolicy) + typename Policy_, + /// Number of stages, + int Stages, + /// Use zfill or predicate for out-of-bound cp.async + cutlass::gemm::SharedMemoryClearOption SharedMemoryClear = cutlass::gemm::SharedMemoryClearOption::kNone, + /// Used for partial specialization + 
typename Enable = bool> +class SrmmaMultistage : + public cutlass::gemm::threadblock::MmaBase { +public: + ///< Base class + using Base = cutlass::gemm::threadblock::MmaBase; + ///< Size of the Gemm problem - concept: gemm::GemmShape<> + using Shape = Shape_; + ///< Iterates over tiles of A operand in global memory + using IteratorA = IteratorA_; + ///< Iterates over tiles of B operand in global memory + using IteratorB = IteratorB_; + ///< Data type of accumulator matrix + using ElementC = ElementC_; + ///< Layout of accumulator matrix + using LayoutC = LayoutC_; + ///< Policy describing tuning details + using Policy = Policy_; + + using SmemIteratorA = SmemIteratorA_; + using SmemIteratorB = SmemIteratorB_; + + static cutlass::arch::CacheOperation::Kind const kCacheOpA = CacheOpA; + static cutlass::arch::CacheOperation::Kind const kCacheOpB = CacheOpB; + + // + // Dependent types + // + + /// Fragment of accumulator tile + using FragmentC = typename Policy::Operator::FragmentC; + + /// Warp-level Mma + using Operator = typename Policy::Operator; + + /// Minimum architecture is Sm80 to support cp.async + using ArchTag = cutlass::arch::Sm80; + + /// Complex transform on A operand + static cutlass::ComplexTransform const kTransformA = Operator::kTransformA; + + /// Complex transform on B operand + static cutlass::ComplexTransform const kTransformB = Operator::kTransformB; + + /// Internal structure exposed for introspection. 
+ struct Detail { + + static_assert(Base::kWarpGemmIterations > 1, + "The pipelined structure requires at least two warp-level " + "GEMM operations."); + + /// Number of cp.async instructions to load one stage of operand A + static int const AsyncCopyIterationsPerStageA = + IteratorA::ThreadMap::Iterations::kCount; + + /// Number of cp.async instructions to load one stage of operand B + static int const AsyncCopyIterationsPerStageB = + IteratorB::ThreadMap::Iterations::kCount; + + /// Number of stages + static int const kStages = Stages; + + /// Number of cp.async instructions to load one group of operand A + static int const kAccessesPerGroupA = + (AsyncCopyIterationsPerStageA + Base::kWarpGemmIterations - 1) / Base::kWarpGemmIterations; + + /// Number of cp.async instructions to load one group of operand B + static int const kAccessesPerGroupB = + (AsyncCopyIterationsPerStageB + Base::kWarpGemmIterations - 1) / Base::kWarpGemmIterations; + }; + + private: + + using WarpLoadedFragmentA = typename Operator::FragmentA; + using WarpLoadedFragmentB = typename Operator::FragmentB; + using WarpTransformedFragmentA = typename Operator::TransformedFragmentA; + using WarpTransformedFragmentB = typename Operator::TransformedFragmentB; + + private: + + // + // Data members + // + + /// Iterator to write threadblock-scoped tile of A operand to shared memory + SmemIteratorA smem_iterator_A_; + + /// Iterator to write threadblock-scoped tile of B operand to shared memory + SmemIteratorB smem_iterator_B_; + + /// Additive operator's identity value, used to initialize registers and smem + ElementC additive_identity_; + +public: + + /// Construct from tensor references + CUTLASS_DEVICE + SrmmaMultistage( + ///< Shared storage needed for internal use by threadblock-scoped GEMM + typename Base::SharedStorage &shared_storage, + ///< ID within the threadblock + int thread_idx, + ///< ID of warp + int warp_idx, + ///< ID of each thread within a warp + int lane_idx, + ///< Identity value 
of addition op + ElementC additive_identity + ): + Base(shared_storage, thread_idx, warp_idx, lane_idx), + smem_iterator_A_(shared_storage.operand_A_ref(), thread_idx), + smem_iterator_B_(shared_storage.operand_B_ref(), thread_idx), + additive_identity_(additive_identity) + { + // Compute warp location within threadblock tile by mapping the warp_id to + // three coordinates: + // _m: the warp's position within the threadblock along the M dimension + // _n: the warp's position within the threadblock along the N dimension + // _k: the warp's position within the threadblock along the K dimension + + int warp_idx_mn = warp_idx % (Base::WarpCount::kM * Base::WarpCount::kN); + int warp_idx_k = warp_idx / (Base::WarpCount::kM * Base::WarpCount::kN); + + int warp_idx_m = warp_idx_mn % Base::WarpCount::kM; + int warp_idx_n = warp_idx_mn / Base::WarpCount::kM; + + // Add per-warp offsets in units of warp-level tiles + this->warp_tile_iterator_A_.add_tile_offset( + {warp_idx_m, Base::kWarpGemmIterations * warp_idx_k}); + this->warp_tile_iterator_B_.add_tile_offset( + {Base::kWarpGemmIterations * warp_idx_k, warp_idx_n}); + } + + CUTLASS_DEVICE + void copy_tiles_and_advance(IteratorA &iterator_A, IteratorB &iterator_B, + int group_start_A = 0, int group_start_B = 0) { + iterator_A.set_iteration_index(group_start_A * + IteratorA::kAccessesPerVector); + this->smem_iterator_A_.set_iteration_index(group_start_A); + + // Async Copy for operand A + CUTLASS_PRAGMA_UNROLL + for (int j = 0; j < Detail::kAccessesPerGroupA; ++j) { + if (group_start_A + j < Detail::AsyncCopyIterationsPerStageA) { + typename IteratorA::AccessType *dst_ptr = + reinterpret_cast( + this->smem_iterator_A_.get()); + + int const kSrcBytes = cutlass::sizeof_bits::value * + IteratorA::ThreadMap::kElementsPerAccess / + IteratorA::kAccessesPerVector / 8; + + CUTLASS_PRAGMA_UNROLL + for (int v = 0; v < IteratorA::kAccessesPerVector; ++v) { + auto gmem_ptr = iterator_A.get(); + + if (SharedMemoryClear == 
cutlass::gemm::SharedMemoryClearOption::kZfill) { + cutlass::arch::cp_async_zfill( + dst_ptr + v, gmem_ptr, iterator_A.valid()); + } else { + cutlass::arch::cp_async( + dst_ptr + v, gmem_ptr, iterator_A.valid()); + } + + ++iterator_A; + } + + ++this->smem_iterator_A_; + } + } + + iterator_B.set_iteration_index(group_start_B * + IteratorB::kAccessesPerVector); + this->smem_iterator_B_.set_iteration_index(group_start_B); + + // Async Copy for operand B + CUTLASS_PRAGMA_UNROLL + for (int j = 0; j < Detail::kAccessesPerGroupB; ++j) { + if (group_start_B + j < Detail::AsyncCopyIterationsPerStageB) { + typename IteratorB::AccessType *dst_ptr = + reinterpret_cast( + this->smem_iterator_B_.get()); + + int const kSrcBytes = cutlass::sizeof_bits::value * + IteratorB::ThreadMap::kElementsPerAccess / + IteratorB::kAccessesPerVector / 8; + + CUTLASS_PRAGMA_UNROLL + for (int v = 0; v < IteratorB::kAccessesPerVector; ++v) { + auto gmem_ptr = iterator_B.get(); + + if (SharedMemoryClear == cutlass::gemm::SharedMemoryClearOption::kZfill) { + cutlass::arch::cp_async_zfill( + dst_ptr + v, gmem_ptr, iterator_B.valid()); + } else { + cutlass::arch::cp_async( + dst_ptr + v, gmem_ptr, iterator_B.valid()); + } + + ++iterator_B; + } + ++this->smem_iterator_B_; + } + } + } + + /// Perform a threadblock-scoped matrix multiply-accumulate + CUTLASS_DEVICE + void operator()( + ///< problem size of GEMM + int gemm_k_iterations, + ///< destination accumulator tile + FragmentC &accum, + ///< iterator over A operand in global memory + IteratorA iterator_A, + ///< iterator over B operand in global memory + IteratorB iterator_B, + ///< initial value of accumulator + FragmentC const &src_accum) { + + // + // Prologue + // + + // Issue several complete stages + CUTLASS_PRAGMA_UNROLL + for (int stage = 0; stage < Base::kStages - 1; + ++stage, --gemm_k_iterations) { + + iterator_A.clear_mask(gemm_k_iterations == 0); + iterator_B.clear_mask(gemm_k_iterations == 0); + + iterator_A.set_iteration_index(0); + 
this->smem_iterator_A_.set_iteration_index(0); + + // Async Copy for operand A + CUTLASS_PRAGMA_UNROLL + for (int j = 0; j < Detail::AsyncCopyIterationsPerStageA; ++j) { + typename IteratorA::AccessType *dst_ptr = + reinterpret_cast( + this->smem_iterator_A_.get()); + + CUTLASS_PRAGMA_UNROLL + for (int v = 0; v < IteratorA::kAccessesPerVector; ++v) { + int const kSrcBytes = + cutlass::sizeof_bits::value * + IteratorA::ThreadMap::kElementsPerAccess / + IteratorA::kAccessesPerVector / 8; + + int src_bytes = (iterator_A.valid() ? kSrcBytes : 0); + + cutlass::arch::cp_async_zfill( + dst_ptr + v, iterator_A.get(), iterator_A.valid()); + + ++iterator_A; + } + + ++this->smem_iterator_A_; + } + + iterator_B.set_iteration_index(0); + this->smem_iterator_B_.set_iteration_index(0); + + // Async Copy for operand B + CUTLASS_PRAGMA_UNROLL + for (int j = 0; j < Detail::AsyncCopyIterationsPerStageB; ++j) { + typename IteratorB::AccessType *dst_ptr = + reinterpret_cast( + this->smem_iterator_B_.get()); + + CUTLASS_PRAGMA_UNROLL + for (int v = 0; v < IteratorB::kAccessesPerVector; ++v) { + int const kSrcBytes = + cutlass::sizeof_bits::value * + IteratorB::ThreadMap::kElementsPerAccess / + IteratorB::kAccessesPerVector / 8; + + cutlass::arch::cp_async_zfill( + dst_ptr + v, iterator_B.get(), iterator_B.valid()); + + ++iterator_B; + } + + ++this->smem_iterator_B_; + } + + // Move to the next stage + iterator_A.add_tile_offset({0, 1}); + iterator_B.add_tile_offset({1, 0}); + + this->smem_iterator_A_.add_tile_offset({0, 1}); + this->smem_iterator_B_.add_tile_offset({1, 0}); + + // Defines the boundary of a stage of cp.async. + cutlass::arch::cp_async_fence(); + } + + // Perform accumulation in the 'd' output operand + accum = src_accum; + + // + // Clear the remaining tiles of SMEM. This is a functional requirement for some kernels + // so that all accumulator elements outside the GEMM footprint are zero. 
+ // + + if (SharedMemoryClear == cutlass::gemm::SharedMemoryClearOption::kClearLastStage) { + + /// Iterator to write threadblock-scoped tile of A operand to shared memory + SmemIteratorA last_smem_iterator_A(this->smem_iterator_A_); + + typename IteratorA::AccessType zero_A; + zero_A.clear(); + + last_smem_iterator_A.set_iteration_index(0); + + // Async Copy for operand A + CUTLASS_PRAGMA_UNROLL + for (int j = 0; j < Detail::AsyncCopyIterationsPerStageA; ++j) { + + typename IteratorA::AccessType *dst_ptr = + reinterpret_cast( + last_smem_iterator_A.get()); + + *dst_ptr = zero_A; + + ++last_smem_iterator_A; + } + + /// Iterator to write threadblock-scoped tile of B operand to shared memory + SmemIteratorB last_smem_iterator_B(this->smem_iterator_B_); + typename IteratorB::AccessType zero_B; + + zero_B.clear(); + last_smem_iterator_B.set_iteration_index(0); + + // Async Copy for operand B + CUTLASS_PRAGMA_UNROLL + for (int j = 0; j < Detail::AsyncCopyIterationsPerStageB; ++j) { + + typename IteratorB::AccessType *dst_ptr = + reinterpret_cast( + last_smem_iterator_B.get()); + + *dst_ptr = zero_B; + + ++last_smem_iterator_B; + } + } + + // Waits until kStages-2 stages have committed. 
+ cutlass::arch::cp_async_wait(); + __syncthreads(); + + // Pair of fragments used to overlap shared memory loads and math + // instructions + WarpLoadedFragmentA warp_loaded_frag_A[2]; + WarpLoadedFragmentB warp_loaded_frag_B[2]; + + warp_loaded_frag_A[0].fill(additive_identity_); + warp_loaded_frag_A[1].fill(additive_identity_); + warp_loaded_frag_B[0].fill(additive_identity_); + warp_loaded_frag_B[1].fill(additive_identity_); + + WarpTransformedFragmentA warp_transformed_frag_A[2]; + WarpTransformedFragmentB warp_transformed_frag_B[2]; + + // TODO: see if we can get away without this, should be possible + warp_transformed_frag_A[0].fill(additive_identity_); + warp_transformed_frag_A[1].fill(additive_identity_); + warp_transformed_frag_B[0].fill(additive_identity_); + warp_transformed_frag_B[1].fill(additive_identity_); + + Operator warp_mma; + + this->warp_tile_iterator_A_.set_kgroup_index(0); + this->warp_tile_iterator_B_.set_kgroup_index(0); + + this->warp_tile_iterator_A_.load(warp_loaded_frag_A[0]); + this->warp_tile_iterator_B_.load(warp_loaded_frag_B[0]); + + ++this->warp_tile_iterator_A_; + ++this->warp_tile_iterator_B_; + + iterator_A.clear_mask(gemm_k_iterations == 0); + iterator_B.clear_mask(gemm_k_iterations == 0); + + int smem_write_stage_idx = Base::kStages - 1; + int smem_read_stage_idx = 0; + + warp_mma.transform(warp_transformed_frag_A[0], warp_transformed_frag_B[0], + warp_loaded_frag_A[0], warp_loaded_frag_B[0]); + + // + // Mainloop + // + + CUTLASS_GEMM_LOOP + for (; gemm_k_iterations > (-Base::kStages + 1);) { + // + // Loop over GEMM K dimension + // + + // Computes a warp-level GEMM on data held in shared memory + // Each "warp_mma_k" refers to a warp-level matrix multiply-accumulate + CUTLASS_PRAGMA_UNROLL + for (int warp_mma_k = 0; warp_mma_k < Base::kWarpGemmIterations; + ++warp_mma_k) { + + // Load warp-level tiles from shared memory, wrapping to k offset if + // this is the last group as the case may be. 
+ + this->warp_tile_iterator_A_.set_kgroup_index((warp_mma_k + 1) % Base::kWarpGemmIterations); + this->warp_tile_iterator_B_.set_kgroup_index((warp_mma_k + 1) % Base::kWarpGemmIterations); + + this->warp_tile_iterator_A_.load(warp_loaded_frag_A[(warp_mma_k + 1) % 2]); + this->warp_tile_iterator_B_.load(warp_loaded_frag_B[(warp_mma_k + 1) % 2]); + + ++this->warp_tile_iterator_A_; + ++this->warp_tile_iterator_B_; + + if (warp_mma_k > 0) + warp_mma.transform(warp_transformed_frag_A[warp_mma_k % 2], + warp_transformed_frag_B[warp_mma_k % 2], + warp_loaded_frag_A[warp_mma_k % 2], + warp_loaded_frag_B[warp_mma_k % 2]); + + warp_mma( + accum, + warp_transformed_frag_A[warp_mma_k % 2], + warp_transformed_frag_B[warp_mma_k % 2], + accum + ); + + // Issue global->shared copies for this stage + if (warp_mma_k < Base::kWarpGemmIterations - 1) { + int group_start_iteration_A, group_start_iteration_B; + + group_start_iteration_A = warp_mma_k * Detail::kAccessesPerGroupA; + group_start_iteration_B = warp_mma_k * Detail::kAccessesPerGroupB; + + copy_tiles_and_advance(iterator_A, iterator_B, group_start_iteration_A, + group_start_iteration_B); + } + + if (warp_mma_k + 2 == Base::kWarpGemmIterations) { + int group_start_iteration_A, group_start_iteration_B; + group_start_iteration_A = + (warp_mma_k + 1) * Detail::kAccessesPerGroupA; + group_start_iteration_B = + (warp_mma_k + 1) * Detail::kAccessesPerGroupB; + + copy_tiles_and_advance(iterator_A, iterator_B, group_start_iteration_A, + group_start_iteration_B); + + // Inserts a memory fence between stages of cp.async instructions. + cutlass::arch::cp_async_fence(); + + // Waits until kStages-2 stages have committed. 
+ cutlass::arch::cp_async_wait(); + __syncthreads(); + + // Move to the next stage + iterator_A.add_tile_offset({0, 1}); + iterator_B.add_tile_offset({1, 0}); + + this->smem_iterator_A_.add_tile_offset({0, 1}); + this->smem_iterator_B_.add_tile_offset({1, 0}); + + // Add negative offsets to return iterators to the 'start' of the + // circular buffer in shared memory + if (smem_write_stage_idx == (Base::kStages - 1)) { + this->smem_iterator_A_.add_tile_offset({0, -Base::kStages}); + this->smem_iterator_B_.add_tile_offset({-Base::kStages, 0}); + smem_write_stage_idx = 0; + } else { + ++smem_write_stage_idx; + } + + if (smem_read_stage_idx == (Base::kStages - 1)) { + this->warp_tile_iterator_A_.add_tile_offset( + {0, -Base::kStages * Policy::kPartitionsK * + Base::kWarpGemmIterations}); + this->warp_tile_iterator_B_.add_tile_offset( + {-Base::kStages * Policy::kPartitionsK * + Base::kWarpGemmIterations, + 0}); + smem_read_stage_idx = 0; + } else { + ++smem_read_stage_idx; + } + + --gemm_k_iterations; + iterator_A.clear_mask(gemm_k_iterations == 0); + iterator_B.clear_mask(gemm_k_iterations == 0); + } + + // Do any conversions feeding the first stage at the end of the loop so + // we can start right away on mma instructions + if (warp_mma_k + 1 == Base::kWarpGemmIterations) + warp_mma.transform(warp_transformed_frag_A[(warp_mma_k + 1) % 2], + warp_transformed_frag_B[(warp_mma_k + 1) % 2], + warp_loaded_frag_A[(warp_mma_k + 1) % 2], + warp_loaded_frag_B[(warp_mma_k + 1) % 2]); + } + + } + + if (SharedMemoryClear == cutlass::gemm::SharedMemoryClearOption::kZfill) { + // commit and drain all pending and predicated LDGSTS pnz from the GEMM mainloop + cutlass::arch::cp_async_fence(); + cutlass::arch::cp_async_wait<0>(); + __syncthreads(); + } + + } +}; + +///////////////////////////////////////////////////////////////////////////////////////////////// + +} // namespace threadblock +} // namespace gemm +} // namespace cuasr + 
+///////////////////////////////////////////////////////////////////////////////////////////////// diff --git a/include/cuasr/gemm/warp/srmma_simt.h b/include/cuasr/gemm/warp/srmma_simt.h index f0e8141..2a7a32a 100644 --- a/include/cuasr/gemm/warp/srmma_simt.h +++ b/include/cuasr/gemm/warp/srmma_simt.h @@ -148,6 +148,8 @@ class SrmmaSimt { /// Storage for A tile using FragmentA = typename IteratorA::Fragment; + /// Storage for transformed A tile + using TransformedFragmentA = FragmentA; /// Iterates over the B operand in memory using IteratorB = cutlass::gemm::warp::MmaSimtTileIterator< @@ -162,6 +164,8 @@ class SrmmaSimt { /// Storage for B tile using FragmentB = typename IteratorB::Fragment; + /// Storage for transformed B tile + using TransformedFragmentB = FragmentB; /// Iterates over the C operand in memory using IteratorC = cutlass::gemm::warp::MmaSimtTileIterator< @@ -197,6 +201,15 @@ class SrmmaSimt { srmma(d, a, b, c); } + + /// Transform the mma operands to the required types + CUTLASS_DEVICE + void transform(TransformedFragmentA &dst_A, TransformedFragmentB &dst_B, + FragmentA const &A, FragmentB const &B) const { + //TODO: Implement this + dst_A = A; + dst_B = B; + } }; ///////////////////////////////////////////////////////////////////////////////////////////////// From 79643288bca3d6c45ff086afefd724655d9d21e1 Mon Sep 17 00:00:00 2001 From: Void Date: Wed, 3 Nov 2021 08:14:31 -0400 Subject: [PATCH 10/15] add default config benchmarks for ampere --- bench/device/CMakeLists.txt | 26 +- bench/device/sm80_defaults.cu | 4366 +++++++++++++++++++++++++++++++++ 2 files changed, 4388 insertions(+), 4 deletions(-) create mode 100644 bench/device/sm80_defaults.cu diff --git a/bench/device/CMakeLists.txt b/bench/device/CMakeLists.txt index ef85505..a10eeab 100644 --- a/bench/device/CMakeLists.txt +++ b/bench/device/CMakeLists.txt @@ -1,16 +1,34 @@ -# Just the default configurations -add_executable(cuasr_bench_srgemm_device_defaults +# SM50 default configurations 
+add_executable(cuasr_bench_srgemm_device_sm50_defaults sm50_defaults.cu ) target_include_directories( - cuasr_bench_srgemm_device_defaults + cuasr_bench_srgemm_device_sm50_defaults PRIVATE ${PROJECT_SOURCE_DIR}/include/ ${PROJECT_SOURCE_DIR}/tools/include/ ${PROJECT_SOURCE_DIR}/cutlass/include/ ${PROJECT_SOURCE_DIR}/cutlass/tools/util/include/ ) -target_link_libraries(cuasr_bench_srgemm_device_defaults +target_link_libraries(cuasr_bench_srgemm_device_sm50_defaults + benchmark + benchmark_main + ${cuASR_LIB_NAME} +) + +# SM80 default configurations +add_executable(cuasr_bench_srgemm_device_sm80_defaults + sm80_defaults.cu +) +target_include_directories( + cuasr_bench_srgemm_device_sm80_defaults + PRIVATE + ${PROJECT_SOURCE_DIR}/include/ + ${PROJECT_SOURCE_DIR}/tools/include/ + ${PROJECT_SOURCE_DIR}/cutlass/include/ + ${PROJECT_SOURCE_DIR}/cutlass/tools/util/include/ +) +target_link_libraries(cuasr_bench_srgemm_device_sm80_defaults + benchmark + benchmark_main + ${cuASR_LIB_NAME} diff --git a/bench/device/sm80_defaults.cu b/bench/device/sm80_defaults.cu new file mode 100644 index 0000000..1357bff --- /dev/null +++ b/bench/device/sm80_defaults.cu @@ -0,0 +1,4366 @@ +/*************************************************************************************************** +* Copyright (c) 2021, Vijay Thakkar (thakkarv@gatech.edu). 
+**************************************************************************************************/ +////////////////////////////////////////////////////////////////////// +// THIS BENCHMARK FILE IS GENERATED AUTOMATICALLY : DO NOT MODIFY // +////////////////////////////////////////////////////////////////////// + +#include "benchmark/benchmark.h" + +#include "cuasr/gemm/device/default_srgemm_configuration.h" +#include "cuasr/gemm/device/srgemm.h" +#include "cuasr/functional.h" + +#include "harness.h" + +/////////////////////////////////////////////////////////////////////////////// + +static void BM_SM80_device_plus_multiplies_dsrgemm_tt_n(benchmark::State &state) { + const auto N = static_cast(state.range(0)); + using precision = double; + using OpClass = cutlass::arch::OpClassSimt; + using SmArch = cutlass::arch::Sm80; + + using AddOp = cuasr::plus; + using MultOp = cuasr::multiplies; + + using Srgemm = cuasr::gemm::device::Srgemm< // + AddOp, MultOp, // + precision, cutlass::layout::RowMajor, // + precision, cutlass::layout::RowMajor, // + precision, cutlass::layout::ColumnMajor, // + precision, OpClass, SmArch>; + + // setup bench harness + cuasr::bench::device::BenchHarness bench({ N, N, N }); + + // benchmark loop + for (auto _ : state) { + benchmark::DoNotOptimize(bench.run()); + cudaDeviceSynchronize(); + } + + double flops_per_itr = 2.0 * N * N * N; + state.counters["Flop/s"] + = benchmark::Counter(flops_per_itr, benchmark::Counter::kIsIterationInvariantRate); +} +BENCHMARK(BM_SM80_device_plus_multiplies_dsrgemm_tt_n) + ->RangeMultiplier(2)->Range(256, 4096); + +/////////////////////////////////////////////////////////////////////////////// + +static void BM_SM80_device_plus_multiplies_dsrgemm_tt_t(benchmark::State &state) { + const auto N = static_cast(state.range(0)); + using precision = double; + using OpClass = cutlass::arch::OpClassSimt; + using SmArch = cutlass::arch::Sm80; + + using AddOp = cuasr::plus; + using MultOp = cuasr::multiplies; + + 
using Srgemm = cuasr::gemm::device::Srgemm< // + AddOp, MultOp, // + precision, cutlass::layout::RowMajor, // + precision, cutlass::layout::RowMajor, // + precision, cutlass::layout::RowMajor, // + precision, OpClass, SmArch>; + + // setup bench harness + cuasr::bench::device::BenchHarness bench({ N, N, N }); + + // benchmark loop + for (auto _ : state) { + benchmark::DoNotOptimize(bench.run()); + cudaDeviceSynchronize(); + } + + double flops_per_itr = 2.0 * N * N * N; + state.counters["Flop/s"] + = benchmark::Counter(flops_per_itr, benchmark::Counter::kIsIterationInvariantRate); +} +BENCHMARK(BM_SM80_device_plus_multiplies_dsrgemm_tt_t) + ->RangeMultiplier(2)->Range(256, 4096); + +/////////////////////////////////////////////////////////////////////////////// + +static void BM_SM80_device_plus_multiplies_dsrgemm_tn_n(benchmark::State &state) { + const auto N = static_cast(state.range(0)); + using precision = double; + using OpClass = cutlass::arch::OpClassSimt; + using SmArch = cutlass::arch::Sm80; + + using AddOp = cuasr::plus; + using MultOp = cuasr::multiplies; + + using Srgemm = cuasr::gemm::device::Srgemm< // + AddOp, MultOp, // + precision, cutlass::layout::RowMajor, // + precision, cutlass::layout::ColumnMajor, // + precision, cutlass::layout::ColumnMajor, // + precision, OpClass, SmArch>; + + // setup bench harness + cuasr::bench::device::BenchHarness bench({ N, N, N }); + + // benchmark loop + for (auto _ : state) { + benchmark::DoNotOptimize(bench.run()); + cudaDeviceSynchronize(); + } + + double flops_per_itr = 2.0 * N * N * N; + state.counters["Flop/s"] + = benchmark::Counter(flops_per_itr, benchmark::Counter::kIsIterationInvariantRate); +} +BENCHMARK(BM_SM80_device_plus_multiplies_dsrgemm_tn_n) + ->RangeMultiplier(2)->Range(256, 4096); + +/////////////////////////////////////////////////////////////////////////////// + +static void BM_SM80_device_plus_multiplies_dsrgemm_tn_t(benchmark::State &state) { + const auto N = static_cast(state.range(0)); + 
using precision = double; + using OpClass = cutlass::arch::OpClassSimt; + using SmArch = cutlass::arch::Sm80; + + using AddOp = cuasr::plus; + using MultOp = cuasr::multiplies; + + using Srgemm = cuasr::gemm::device::Srgemm< // + AddOp, MultOp, // + precision, cutlass::layout::RowMajor, // + precision, cutlass::layout::ColumnMajor, // + precision, cutlass::layout::RowMajor, // + precision, OpClass, SmArch>; + + // setup bench harness + cuasr::bench::device::BenchHarness bench({ N, N, N }); + + // benchmark loop + for (auto _ : state) { + benchmark::DoNotOptimize(bench.run()); + cudaDeviceSynchronize(); + } + + double flops_per_itr = 2.0 * N * N * N; + state.counters["Flop/s"] + = benchmark::Counter(flops_per_itr, benchmark::Counter::kIsIterationInvariantRate); +} +BENCHMARK(BM_SM80_device_plus_multiplies_dsrgemm_tn_t) + ->RangeMultiplier(2)->Range(256, 4096); + +/////////////////////////////////////////////////////////////////////////////// + +static void BM_SM80_device_plus_multiplies_dsrgemm_nt_n(benchmark::State &state) { + const auto N = static_cast(state.range(0)); + using precision = double; + using OpClass = cutlass::arch::OpClassSimt; + using SmArch = cutlass::arch::Sm80; + + using AddOp = cuasr::plus; + using MultOp = cuasr::multiplies; + + using Srgemm = cuasr::gemm::device::Srgemm< // + AddOp, MultOp, // + precision, cutlass::layout::ColumnMajor, // + precision, cutlass::layout::RowMajor, // + precision, cutlass::layout::ColumnMajor, // + precision, OpClass, SmArch>; + + // setup bench harness + cuasr::bench::device::BenchHarness bench({ N, N, N }); + + // benchmark loop + for (auto _ : state) { + benchmark::DoNotOptimize(bench.run()); + cudaDeviceSynchronize(); + } + + double flops_per_itr = 2.0 * N * N * N; + state.counters["Flop/s"] + = benchmark::Counter(flops_per_itr, benchmark::Counter::kIsIterationInvariantRate); +} +BENCHMARK(BM_SM80_device_plus_multiplies_dsrgemm_nt_n) + ->RangeMultiplier(2)->Range(256, 4096); + 
+/////////////////////////////////////////////////////////////////////////////// + +static void BM_SM80_device_plus_multiplies_dsrgemm_nt_t(benchmark::State &state) { + const auto N = static_cast(state.range(0)); + using precision = double; + using OpClass = cutlass::arch::OpClassSimt; + using SmArch = cutlass::arch::Sm80; + + using AddOp = cuasr::plus; + using MultOp = cuasr::multiplies; + + using Srgemm = cuasr::gemm::device::Srgemm< // + AddOp, MultOp, // + precision, cutlass::layout::ColumnMajor, // + precision, cutlass::layout::RowMajor, // + precision, cutlass::layout::RowMajor, // + precision, OpClass, SmArch>; + + // setup bench harness + cuasr::bench::device::BenchHarness bench({ N, N, N }); + + // benchmark loop + for (auto _ : state) { + benchmark::DoNotOptimize(bench.run()); + cudaDeviceSynchronize(); + } + + double flops_per_itr = 2.0 * N * N * N; + state.counters["Flop/s"] + = benchmark::Counter(flops_per_itr, benchmark::Counter::kIsIterationInvariantRate); +} +BENCHMARK(BM_SM80_device_plus_multiplies_dsrgemm_nt_t) + ->RangeMultiplier(2)->Range(256, 4096); + +/////////////////////////////////////////////////////////////////////////////// + +static void BM_SM80_device_plus_multiplies_dsrgemm_nn_n(benchmark::State &state) { + const auto N = static_cast(state.range(0)); + using precision = double; + using OpClass = cutlass::arch::OpClassSimt; + using SmArch = cutlass::arch::Sm80; + + using AddOp = cuasr::plus; + using MultOp = cuasr::multiplies; + + using Srgemm = cuasr::gemm::device::Srgemm< // + AddOp, MultOp, // + precision, cutlass::layout::ColumnMajor, // + precision, cutlass::layout::ColumnMajor, // + precision, cutlass::layout::ColumnMajor, // + precision, OpClass, SmArch>; + + // setup bench harness + cuasr::bench::device::BenchHarness bench({ N, N, N }); + + // benchmark loop + for (auto _ : state) { + benchmark::DoNotOptimize(bench.run()); + cudaDeviceSynchronize(); + } + + double flops_per_itr = 2.0 * N * N * N; + state.counters["Flop/s"] + = 
benchmark::Counter(flops_per_itr, benchmark::Counter::kIsIterationInvariantRate); +} +BENCHMARK(BM_SM80_device_plus_multiplies_dsrgemm_nn_n) + ->RangeMultiplier(2)->Range(256, 4096); + +/////////////////////////////////////////////////////////////////////////////// + +static void BM_SM80_device_plus_multiplies_dsrgemm_nn_t(benchmark::State &state) { + const auto N = static_cast(state.range(0)); + using precision = double; + using OpClass = cutlass::arch::OpClassSimt; + using SmArch = cutlass::arch::Sm80; + + using AddOp = cuasr::plus; + using MultOp = cuasr::multiplies; + + using Srgemm = cuasr::gemm::device::Srgemm< // + AddOp, MultOp, // + precision, cutlass::layout::ColumnMajor, // + precision, cutlass::layout::ColumnMajor, // + precision, cutlass::layout::RowMajor, // + precision, OpClass, SmArch>; + + // setup bench harness + cuasr::bench::device::BenchHarness bench({ N, N, N }); + + // benchmark loop + for (auto _ : state) { + benchmark::DoNotOptimize(bench.run()); + cudaDeviceSynchronize(); + } + + double flops_per_itr = 2.0 * N * N * N; + state.counters["Flop/s"] + = benchmark::Counter(flops_per_itr, benchmark::Counter::kIsIterationInvariantRate); +} +BENCHMARK(BM_SM80_device_plus_multiplies_dsrgemm_nn_t) + ->RangeMultiplier(2)->Range(256, 4096); + +/////////////////////////////////////////////////////////////////////////////// + +static void BM_SM80_device_plus_multiplies_ssrgemm_tt_n(benchmark::State &state) { + const auto N = static_cast(state.range(0)); + using precision = float; + using OpClass = cutlass::arch::OpClassSimt; + using SmArch = cutlass::arch::Sm80; + + using AddOp = cuasr::plus; + using MultOp = cuasr::multiplies; + + using Srgemm = cuasr::gemm::device::Srgemm< // + AddOp, MultOp, // + precision, cutlass::layout::RowMajor, // + precision, cutlass::layout::RowMajor, // + precision, cutlass::layout::ColumnMajor, // + precision, OpClass, SmArch>; + + // setup bench harness + cuasr::bench::device::BenchHarness bench({ N, N, N }); + + // 
benchmark loop + for (auto _ : state) { + benchmark::DoNotOptimize(bench.run()); + cudaDeviceSynchronize(); + } + + double flops_per_itr = 2.0 * N * N * N; + state.counters["Flop/s"] + = benchmark::Counter(flops_per_itr, benchmark::Counter::kIsIterationInvariantRate); +} +BENCHMARK(BM_SM80_device_plus_multiplies_ssrgemm_tt_n) + ->RangeMultiplier(2)->Range(256, 4096); + +/////////////////////////////////////////////////////////////////////////////// + +static void BM_SM80_device_plus_multiplies_ssrgemm_tt_t(benchmark::State &state) { + const auto N = static_cast(state.range(0)); + using precision = float; + using OpClass = cutlass::arch::OpClassSimt; + using SmArch = cutlass::arch::Sm80; + + using AddOp = cuasr::plus; + using MultOp = cuasr::multiplies; + + using Srgemm = cuasr::gemm::device::Srgemm< // + AddOp, MultOp, // + precision, cutlass::layout::RowMajor, // + precision, cutlass::layout::RowMajor, // + precision, cutlass::layout::RowMajor, // + precision, OpClass, SmArch>; + + // setup bench harness + cuasr::bench::device::BenchHarness bench({ N, N, N }); + + // benchmark loop + for (auto _ : state) { + benchmark::DoNotOptimize(bench.run()); + cudaDeviceSynchronize(); + } + + double flops_per_itr = 2.0 * N * N * N; + state.counters["Flop/s"] + = benchmark::Counter(flops_per_itr, benchmark::Counter::kIsIterationInvariantRate); +} +BENCHMARK(BM_SM80_device_plus_multiplies_ssrgemm_tt_t) + ->RangeMultiplier(2)->Range(256, 4096); + +/////////////////////////////////////////////////////////////////////////////// + +static void BM_SM80_device_plus_multiplies_ssrgemm_tn_n(benchmark::State &state) { + const auto N = static_cast(state.range(0)); + using precision = float; + using OpClass = cutlass::arch::OpClassSimt; + using SmArch = cutlass::arch::Sm80; + + using AddOp = cuasr::plus; + using MultOp = cuasr::multiplies; + + using Srgemm = cuasr::gemm::device::Srgemm< // + AddOp, MultOp, // + precision, cutlass::layout::RowMajor, // + precision, 
cutlass::layout::ColumnMajor, // + precision, cutlass::layout::ColumnMajor, // + precision, OpClass, SmArch>; + + // setup bench harness + cuasr::bench::device::BenchHarness bench({ N, N, N }); + + // benchmark loop + for (auto _ : state) { + benchmark::DoNotOptimize(bench.run()); + cudaDeviceSynchronize(); + } + + double flops_per_itr = 2.0 * N * N * N; + state.counters["Flop/s"] + = benchmark::Counter(flops_per_itr, benchmark::Counter::kIsIterationInvariantRate); +} +BENCHMARK(BM_SM80_device_plus_multiplies_ssrgemm_tn_n) + ->RangeMultiplier(2)->Range(256, 4096); + +/////////////////////////////////////////////////////////////////////////////// + +static void BM_SM80_device_plus_multiplies_ssrgemm_tn_t(benchmark::State &state) { + const auto N = static_cast(state.range(0)); + using precision = float; + using OpClass = cutlass::arch::OpClassSimt; + using SmArch = cutlass::arch::Sm80; + + using AddOp = cuasr::plus; + using MultOp = cuasr::multiplies; + + using Srgemm = cuasr::gemm::device::Srgemm< // + AddOp, MultOp, // + precision, cutlass::layout::RowMajor, // + precision, cutlass::layout::ColumnMajor, // + precision, cutlass::layout::RowMajor, // + precision, OpClass, SmArch>; + + // setup bench harness + cuasr::bench::device::BenchHarness bench({ N, N, N }); + + // benchmark loop + for (auto _ : state) { + benchmark::DoNotOptimize(bench.run()); + cudaDeviceSynchronize(); + } + + double flops_per_itr = 2.0 * N * N * N; + state.counters["Flop/s"] + = benchmark::Counter(flops_per_itr, benchmark::Counter::kIsIterationInvariantRate); +} +BENCHMARK(BM_SM80_device_plus_multiplies_ssrgemm_tn_t) + ->RangeMultiplier(2)->Range(256, 4096); + +/////////////////////////////////////////////////////////////////////////////// + +static void BM_SM80_device_plus_multiplies_ssrgemm_nt_n(benchmark::State &state) { + const auto N = static_cast(state.range(0)); + using precision = float; + using OpClass = cutlass::arch::OpClassSimt; + using SmArch = cutlass::arch::Sm80; + + using 
AddOp = cuasr::plus; + using MultOp = cuasr::multiplies; + + using Srgemm = cuasr::gemm::device::Srgemm< // + AddOp, MultOp, // + precision, cutlass::layout::ColumnMajor, // + precision, cutlass::layout::RowMajor, // + precision, cutlass::layout::ColumnMajor, // + precision, OpClass, SmArch>; + + // setup bench harness + cuasr::bench::device::BenchHarness bench({ N, N, N }); + + // benchmark loop + for (auto _ : state) { + benchmark::DoNotOptimize(bench.run()); + cudaDeviceSynchronize(); + } + + double flops_per_itr = 2.0 * N * N * N; + state.counters["Flop/s"] + = benchmark::Counter(flops_per_itr, benchmark::Counter::kIsIterationInvariantRate); +} +BENCHMARK(BM_SM80_device_plus_multiplies_ssrgemm_nt_n) + ->RangeMultiplier(2)->Range(256, 4096); + +/////////////////////////////////////////////////////////////////////////////// + +static void BM_SM80_device_plus_multiplies_ssrgemm_nt_t(benchmark::State &state) { + const auto N = static_cast(state.range(0)); + using precision = float; + using OpClass = cutlass::arch::OpClassSimt; + using SmArch = cutlass::arch::Sm80; + + using AddOp = cuasr::plus; + using MultOp = cuasr::multiplies; + + using Srgemm = cuasr::gemm::device::Srgemm< // + AddOp, MultOp, // + precision, cutlass::layout::ColumnMajor, // + precision, cutlass::layout::RowMajor, // + precision, cutlass::layout::RowMajor, // + precision, OpClass, SmArch>; + + // setup bench harness + cuasr::bench::device::BenchHarness bench({ N, N, N }); + + // benchmark loop + for (auto _ : state) { + benchmark::DoNotOptimize(bench.run()); + cudaDeviceSynchronize(); + } + + double flops_per_itr = 2.0 * N * N * N; + state.counters["Flop/s"] + = benchmark::Counter(flops_per_itr, benchmark::Counter::kIsIterationInvariantRate); +} +BENCHMARK(BM_SM80_device_plus_multiplies_ssrgemm_nt_t) + ->RangeMultiplier(2)->Range(256, 4096); + +/////////////////////////////////////////////////////////////////////////////// + +static void 
BM_SM80_device_plus_multiplies_ssrgemm_nn_n(benchmark::State &state) { + const auto N = static_cast(state.range(0)); + using precision = float; + using OpClass = cutlass::arch::OpClassSimt; + using SmArch = cutlass::arch::Sm80; + + using AddOp = cuasr::plus; + using MultOp = cuasr::multiplies; + + using Srgemm = cuasr::gemm::device::Srgemm< // + AddOp, MultOp, // + precision, cutlass::layout::ColumnMajor, // + precision, cutlass::layout::ColumnMajor, // + precision, cutlass::layout::ColumnMajor, // + precision, OpClass, SmArch>; + + // setup bench harness + cuasr::bench::device::BenchHarness bench({ N, N, N }); + + // benchmark loop + for (auto _ : state) { + benchmark::DoNotOptimize(bench.run()); + cudaDeviceSynchronize(); + } + + double flops_per_itr = 2.0 * N * N * N; + state.counters["Flop/s"] + = benchmark::Counter(flops_per_itr, benchmark::Counter::kIsIterationInvariantRate); +} +BENCHMARK(BM_SM80_device_plus_multiplies_ssrgemm_nn_n) + ->RangeMultiplier(2)->Range(256, 4096); + +/////////////////////////////////////////////////////////////////////////////// + +static void BM_SM80_device_plus_multiplies_ssrgemm_nn_t(benchmark::State &state) { + const auto N = static_cast(state.range(0)); + using precision = float; + using OpClass = cutlass::arch::OpClassSimt; + using SmArch = cutlass::arch::Sm80; + + using AddOp = cuasr::plus; + using MultOp = cuasr::multiplies; + + using Srgemm = cuasr::gemm::device::Srgemm< // + AddOp, MultOp, // + precision, cutlass::layout::ColumnMajor, // + precision, cutlass::layout::ColumnMajor, // + precision, cutlass::layout::RowMajor, // + precision, OpClass, SmArch>; + + // setup bench harness + cuasr::bench::device::BenchHarness bench({ N, N, N }); + + // benchmark loop + for (auto _ : state) { + benchmark::DoNotOptimize(bench.run()); + cudaDeviceSynchronize(); + } + + double flops_per_itr = 2.0 * N * N * N; + state.counters["Flop/s"] + = benchmark::Counter(flops_per_itr, benchmark::Counter::kIsIterationInvariantRate); +} 
+BENCHMARK(BM_SM80_device_plus_multiplies_ssrgemm_nn_t) + ->RangeMultiplier(2)->Range(256, 4096); + +/////////////////////////////////////////////////////////////////////////////// + +static void BM_SM80_device_minimum_plus_dsrgemm_tt_n(benchmark::State &state) { + const auto N = static_cast(state.range(0)); + using precision = double; + using OpClass = cutlass::arch::OpClassSimt; + using SmArch = cutlass::arch::Sm80; + + using AddOp = cuasr::minimum; + using MultOp = cuasr::plus; + + using Srgemm = cuasr::gemm::device::Srgemm< // + AddOp, MultOp, // + precision, cutlass::layout::RowMajor, // + precision, cutlass::layout::RowMajor, // + precision, cutlass::layout::ColumnMajor, // + precision, OpClass, SmArch>; + + // setup bench harness + cuasr::bench::device::BenchHarness bench({ N, N, N }); + + // benchmark loop + for (auto _ : state) { + benchmark::DoNotOptimize(bench.run()); + cudaDeviceSynchronize(); + } + + double flops_per_itr = 2.0 * N * N * N; + state.counters["Flop/s"] + = benchmark::Counter(flops_per_itr, benchmark::Counter::kIsIterationInvariantRate); +} +BENCHMARK(BM_SM80_device_minimum_plus_dsrgemm_tt_n) + ->RangeMultiplier(2)->Range(256, 4096); + +/////////////////////////////////////////////////////////////////////////////// + +static void BM_SM80_device_minimum_plus_dsrgemm_tt_t(benchmark::State &state) { + const auto N = static_cast(state.range(0)); + using precision = double; + using OpClass = cutlass::arch::OpClassSimt; + using SmArch = cutlass::arch::Sm80; + + using AddOp = cuasr::minimum; + using MultOp = cuasr::plus; + + using Srgemm = cuasr::gemm::device::Srgemm< // + AddOp, MultOp, // + precision, cutlass::layout::RowMajor, // + precision, cutlass::layout::RowMajor, // + precision, cutlass::layout::RowMajor, // + precision, OpClass, SmArch>; + + // setup bench harness + cuasr::bench::device::BenchHarness bench({ N, N, N }); + + // benchmark loop + for (auto _ : state) { + benchmark::DoNotOptimize(bench.run()); + cudaDeviceSynchronize(); + } 
+ + double flops_per_itr = 2.0 * N * N * N; + state.counters["Flop/s"] + = benchmark::Counter(flops_per_itr, benchmark::Counter::kIsIterationInvariantRate); +} +BENCHMARK(BM_SM80_device_minimum_plus_dsrgemm_tt_t) + ->RangeMultiplier(2)->Range(256, 4096); + +/////////////////////////////////////////////////////////////////////////////// + +static void BM_SM80_device_minimum_plus_dsrgemm_tn_n(benchmark::State &state) { + const auto N = static_cast(state.range(0)); + using precision = double; + using OpClass = cutlass::arch::OpClassSimt; + using SmArch = cutlass::arch::Sm80; + + using AddOp = cuasr::minimum; + using MultOp = cuasr::plus; + + using Srgemm = cuasr::gemm::device::Srgemm< // + AddOp, MultOp, // + precision, cutlass::layout::RowMajor, // + precision, cutlass::layout::ColumnMajor, // + precision, cutlass::layout::ColumnMajor, // + precision, OpClass, SmArch>; + + // setup bench harness + cuasr::bench::device::BenchHarness bench({ N, N, N }); + + // benchmark loop + for (auto _ : state) { + benchmark::DoNotOptimize(bench.run()); + cudaDeviceSynchronize(); + } + + double flops_per_itr = 2.0 * N * N * N; + state.counters["Flop/s"] + = benchmark::Counter(flops_per_itr, benchmark::Counter::kIsIterationInvariantRate); +} +BENCHMARK(BM_SM80_device_minimum_plus_dsrgemm_tn_n) + ->RangeMultiplier(2)->Range(256, 4096); + +/////////////////////////////////////////////////////////////////////////////// + +static void BM_SM80_device_minimum_plus_dsrgemm_tn_t(benchmark::State &state) { + const auto N = static_cast(state.range(0)); + using precision = double; + using OpClass = cutlass::arch::OpClassSimt; + using SmArch = cutlass::arch::Sm80; + + using AddOp = cuasr::minimum; + using MultOp = cuasr::plus; + + using Srgemm = cuasr::gemm::device::Srgemm< // + AddOp, MultOp, // + precision, cutlass::layout::RowMajor, // + precision, cutlass::layout::ColumnMajor, // + precision, cutlass::layout::RowMajor, // + precision, OpClass, SmArch>; + + // setup bench harness + 
cuasr::bench::device::BenchHarness bench({ N, N, N }); + + // benchmark loop + for (auto _ : state) { + benchmark::DoNotOptimize(bench.run()); + cudaDeviceSynchronize(); + } + + double flops_per_itr = 2.0 * N * N * N; + state.counters["Flop/s"] + = benchmark::Counter(flops_per_itr, benchmark::Counter::kIsIterationInvariantRate); +} +BENCHMARK(BM_SM80_device_minimum_plus_dsrgemm_tn_t) + ->RangeMultiplier(2)->Range(256, 4096); + +/////////////////////////////////////////////////////////////////////////////// + +static void BM_SM80_device_minimum_plus_dsrgemm_nt_n(benchmark::State &state) { + const auto N = static_cast(state.range(0)); + using precision = double; + using OpClass = cutlass::arch::OpClassSimt; + using SmArch = cutlass::arch::Sm80; + + using AddOp = cuasr::minimum; + using MultOp = cuasr::plus; + + using Srgemm = cuasr::gemm::device::Srgemm< // + AddOp, MultOp, // + precision, cutlass::layout::ColumnMajor, // + precision, cutlass::layout::RowMajor, // + precision, cutlass::layout::ColumnMajor, // + precision, OpClass, SmArch>; + + // setup bench harness + cuasr::bench::device::BenchHarness bench({ N, N, N }); + + // benchmark loop + for (auto _ : state) { + benchmark::DoNotOptimize(bench.run()); + cudaDeviceSynchronize(); + } + + double flops_per_itr = 2.0 * N * N * N; + state.counters["Flop/s"] + = benchmark::Counter(flops_per_itr, benchmark::Counter::kIsIterationInvariantRate); +} +BENCHMARK(BM_SM80_device_minimum_plus_dsrgemm_nt_n) + ->RangeMultiplier(2)->Range(256, 4096); + +/////////////////////////////////////////////////////////////////////////////// + +static void BM_SM80_device_minimum_plus_dsrgemm_nt_t(benchmark::State &state) { + const auto N = static_cast(state.range(0)); + using precision = double; + using OpClass = cutlass::arch::OpClassSimt; + using SmArch = cutlass::arch::Sm80; + + using AddOp = cuasr::minimum; + using MultOp = cuasr::plus; + + using Srgemm = cuasr::gemm::device::Srgemm< // + AddOp, MultOp, // + precision, 
cutlass::layout::ColumnMajor, // + precision, cutlass::layout::RowMajor, // + precision, cutlass::layout::RowMajor, // + precision, OpClass, SmArch>; + + // setup bench harness + cuasr::bench::device::BenchHarness bench({ N, N, N }); + + // benchmark loop + for (auto _ : state) { + benchmark::DoNotOptimize(bench.run()); + cudaDeviceSynchronize(); + } + + double flops_per_itr = 2.0 * N * N * N; + state.counters["Flop/s"] + = benchmark::Counter(flops_per_itr, benchmark::Counter::kIsIterationInvariantRate); +} +BENCHMARK(BM_SM80_device_minimum_plus_dsrgemm_nt_t) + ->RangeMultiplier(2)->Range(256, 4096); + +/////////////////////////////////////////////////////////////////////////////// + +static void BM_SM80_device_minimum_plus_dsrgemm_nn_n(benchmark::State &state) { + const auto N = static_cast(state.range(0)); + using precision = double; + using OpClass = cutlass::arch::OpClassSimt; + using SmArch = cutlass::arch::Sm80; + + using AddOp = cuasr::minimum; + using MultOp = cuasr::plus; + + using Srgemm = cuasr::gemm::device::Srgemm< // + AddOp, MultOp, // + precision, cutlass::layout::ColumnMajor, // + precision, cutlass::layout::ColumnMajor, // + precision, cutlass::layout::ColumnMajor, // + precision, OpClass, SmArch>; + + // setup bench harness + cuasr::bench::device::BenchHarness bench({ N, N, N }); + + // benchmark loop + for (auto _ : state) { + benchmark::DoNotOptimize(bench.run()); + cudaDeviceSynchronize(); + } + + double flops_per_itr = 2.0 * N * N * N; + state.counters["Flop/s"] + = benchmark::Counter(flops_per_itr, benchmark::Counter::kIsIterationInvariantRate); +} +BENCHMARK(BM_SM80_device_minimum_plus_dsrgemm_nn_n) + ->RangeMultiplier(2)->Range(256, 4096); + +/////////////////////////////////////////////////////////////////////////////// + +static void BM_SM80_device_minimum_plus_dsrgemm_nn_t(benchmark::State &state) { + const auto N = static_cast(state.range(0)); + using precision = double; + using OpClass = cutlass::arch::OpClassSimt; + using SmArch = 
cutlass::arch::Sm80; + + using AddOp = cuasr::minimum; + using MultOp = cuasr::plus; + + using Srgemm = cuasr::gemm::device::Srgemm< // + AddOp, MultOp, // + precision, cutlass::layout::ColumnMajor, // + precision, cutlass::layout::ColumnMajor, // + precision, cutlass::layout::RowMajor, // + precision, OpClass, SmArch>; + + // setup bench harness + cuasr::bench::device::BenchHarness bench({ N, N, N }); + + // benchmark loop + for (auto _ : state) { + benchmark::DoNotOptimize(bench.run()); + cudaDeviceSynchronize(); + } + + double flops_per_itr = 2.0 * N * N * N; + state.counters["Flop/s"] + = benchmark::Counter(flops_per_itr, benchmark::Counter::kIsIterationInvariantRate); +} +BENCHMARK(BM_SM80_device_minimum_plus_dsrgemm_nn_t) + ->RangeMultiplier(2)->Range(256, 4096); + +/////////////////////////////////////////////////////////////////////////////// + +static void BM_SM80_device_minimum_plus_ssrgemm_tt_n(benchmark::State &state) { + const auto N = static_cast(state.range(0)); + using precision = float; + using OpClass = cutlass::arch::OpClassSimt; + using SmArch = cutlass::arch::Sm80; + + using AddOp = cuasr::minimum; + using MultOp = cuasr::plus; + + using Srgemm = cuasr::gemm::device::Srgemm< // + AddOp, MultOp, // + precision, cutlass::layout::RowMajor, // + precision, cutlass::layout::RowMajor, // + precision, cutlass::layout::ColumnMajor, // + precision, OpClass, SmArch>; + + // setup bench harness + cuasr::bench::device::BenchHarness bench({ N, N, N }); + + // benchmark loop + for (auto _ : state) { + benchmark::DoNotOptimize(bench.run()); + cudaDeviceSynchronize(); + } + + double flops_per_itr = 2.0 * N * N * N; + state.counters["Flop/s"] + = benchmark::Counter(flops_per_itr, benchmark::Counter::kIsIterationInvariantRate); +} +BENCHMARK(BM_SM80_device_minimum_plus_ssrgemm_tt_n) + ->RangeMultiplier(2)->Range(256, 4096); + +/////////////////////////////////////////////////////////////////////////////// + +static void 
BM_SM80_device_minimum_plus_ssrgemm_tt_t(benchmark::State &state) { + const auto N = static_cast(state.range(0)); + using precision = float; + using OpClass = cutlass::arch::OpClassSimt; + using SmArch = cutlass::arch::Sm80; + + using AddOp = cuasr::minimum; + using MultOp = cuasr::plus; + + using Srgemm = cuasr::gemm::device::Srgemm< // + AddOp, MultOp, // + precision, cutlass::layout::RowMajor, // + precision, cutlass::layout::RowMajor, // + precision, cutlass::layout::RowMajor, // + precision, OpClass, SmArch>; + + // setup bench harness + cuasr::bench::device::BenchHarness bench({ N, N, N }); + + // benchmark loop + for (auto _ : state) { + benchmark::DoNotOptimize(bench.run()); + cudaDeviceSynchronize(); + } + + double flops_per_itr = 2.0 * N * N * N; + state.counters["Flop/s"] + = benchmark::Counter(flops_per_itr, benchmark::Counter::kIsIterationInvariantRate); +} +BENCHMARK(BM_SM80_device_minimum_plus_ssrgemm_tt_t) + ->RangeMultiplier(2)->Range(256, 4096); + +/////////////////////////////////////////////////////////////////////////////// + +static void BM_SM80_device_minimum_plus_ssrgemm_tn_n(benchmark::State &state) { + const auto N = static_cast(state.range(0)); + using precision = float; + using OpClass = cutlass::arch::OpClassSimt; + using SmArch = cutlass::arch::Sm80; + + using AddOp = cuasr::minimum; + using MultOp = cuasr::plus; + + using Srgemm = cuasr::gemm::device::Srgemm< // + AddOp, MultOp, // + precision, cutlass::layout::RowMajor, // + precision, cutlass::layout::ColumnMajor, // + precision, cutlass::layout::ColumnMajor, // + precision, OpClass, SmArch>; + + // setup bench harness + cuasr::bench::device::BenchHarness bench({ N, N, N }); + + // benchmark loop + for (auto _ : state) { + benchmark::DoNotOptimize(bench.run()); + cudaDeviceSynchronize(); + } + + double flops_per_itr = 2.0 * N * N * N; + state.counters["Flop/s"] + = benchmark::Counter(flops_per_itr, benchmark::Counter::kIsIterationInvariantRate); +} 
+BENCHMARK(BM_SM80_device_minimum_plus_ssrgemm_tn_n) + ->RangeMultiplier(2)->Range(256, 4096); + +/////////////////////////////////////////////////////////////////////////////// + +static void BM_SM80_device_minimum_plus_ssrgemm_tn_t(benchmark::State &state) { + const auto N = static_cast(state.range(0)); + using precision = float; + using OpClass = cutlass::arch::OpClassSimt; + using SmArch = cutlass::arch::Sm80; + + using AddOp = cuasr::minimum; + using MultOp = cuasr::plus; + + using Srgemm = cuasr::gemm::device::Srgemm< // + AddOp, MultOp, // + precision, cutlass::layout::RowMajor, // + precision, cutlass::layout::ColumnMajor, // + precision, cutlass::layout::RowMajor, // + precision, OpClass, SmArch>; + + // setup bench harness + cuasr::bench::device::BenchHarness bench({ N, N, N }); + + // benchmark loop + for (auto _ : state) { + benchmark::DoNotOptimize(bench.run()); + cudaDeviceSynchronize(); + } + + double flops_per_itr = 2.0 * N * N * N; + state.counters["Flop/s"] + = benchmark::Counter(flops_per_itr, benchmark::Counter::kIsIterationInvariantRate); +} +BENCHMARK(BM_SM80_device_minimum_plus_ssrgemm_tn_t) + ->RangeMultiplier(2)->Range(256, 4096); + +/////////////////////////////////////////////////////////////////////////////// + +static void BM_SM80_device_minimum_plus_ssrgemm_nt_n(benchmark::State &state) { + const auto N = static_cast(state.range(0)); + using precision = float; + using OpClass = cutlass::arch::OpClassSimt; + using SmArch = cutlass::arch::Sm80; + + using AddOp = cuasr::minimum; + using MultOp = cuasr::plus; + + using Srgemm = cuasr::gemm::device::Srgemm< // + AddOp, MultOp, // + precision, cutlass::layout::ColumnMajor, // + precision, cutlass::layout::RowMajor, // + precision, cutlass::layout::ColumnMajor, // + precision, OpClass, SmArch>; + + // setup bench harness + cuasr::bench::device::BenchHarness bench({ N, N, N }); + + // benchmark loop + for (auto _ : state) { + benchmark::DoNotOptimize(bench.run()); + cudaDeviceSynchronize(); + 
} + + double flops_per_itr = 2.0 * N * N * N; + state.counters["Flop/s"] + = benchmark::Counter(flops_per_itr, benchmark::Counter::kIsIterationInvariantRate); +} +BENCHMARK(BM_SM80_device_minimum_plus_ssrgemm_nt_n) + ->RangeMultiplier(2)->Range(256, 4096); + +/////////////////////////////////////////////////////////////////////////////// + +static void BM_SM80_device_minimum_plus_ssrgemm_nt_t(benchmark::State &state) { + const auto N = static_cast(state.range(0)); + using precision = float; + using OpClass = cutlass::arch::OpClassSimt; + using SmArch = cutlass::arch::Sm80; + + using AddOp = cuasr::minimum; + using MultOp = cuasr::plus; + + using Srgemm = cuasr::gemm::device::Srgemm< // + AddOp, MultOp, // + precision, cutlass::layout::ColumnMajor, // + precision, cutlass::layout::RowMajor, // + precision, cutlass::layout::RowMajor, // + precision, OpClass, SmArch>; + + // setup bench harness + cuasr::bench::device::BenchHarness bench({ N, N, N }); + + // benchmark loop + for (auto _ : state) { + benchmark::DoNotOptimize(bench.run()); + cudaDeviceSynchronize(); + } + + double flops_per_itr = 2.0 * N * N * N; + state.counters["Flop/s"] + = benchmark::Counter(flops_per_itr, benchmark::Counter::kIsIterationInvariantRate); +} +BENCHMARK(BM_SM80_device_minimum_plus_ssrgemm_nt_t) + ->RangeMultiplier(2)->Range(256, 4096); + +/////////////////////////////////////////////////////////////////////////////// + +static void BM_SM80_device_minimum_plus_ssrgemm_nn_n(benchmark::State &state) { + const auto N = static_cast(state.range(0)); + using precision = float; + using OpClass = cutlass::arch::OpClassSimt; + using SmArch = cutlass::arch::Sm80; + + using AddOp = cuasr::minimum; + using MultOp = cuasr::plus; + + using Srgemm = cuasr::gemm::device::Srgemm< // + AddOp, MultOp, // + precision, cutlass::layout::ColumnMajor, // + precision, cutlass::layout::ColumnMajor, // + precision, cutlass::layout::ColumnMajor, // + precision, OpClass, SmArch>; + + // setup bench harness + 
cuasr::bench::device::BenchHarness bench({ N, N, N }); + + // benchmark loop + for (auto _ : state) { + benchmark::DoNotOptimize(bench.run()); + cudaDeviceSynchronize(); + } + + double flops_per_itr = 2.0 * N * N * N; + state.counters["Flop/s"] + = benchmark::Counter(flops_per_itr, benchmark::Counter::kIsIterationInvariantRate); +} +BENCHMARK(BM_SM80_device_minimum_plus_ssrgemm_nn_n) + ->RangeMultiplier(2)->Range(256, 4096); + +/////////////////////////////////////////////////////////////////////////////// + +static void BM_SM80_device_minimum_plus_ssrgemm_nn_t(benchmark::State &state) { + const auto N = static_cast(state.range(0)); + using precision = float; + using OpClass = cutlass::arch::OpClassSimt; + using SmArch = cutlass::arch::Sm80; + + using AddOp = cuasr::minimum; + using MultOp = cuasr::plus; + + using Srgemm = cuasr::gemm::device::Srgemm< // + AddOp, MultOp, // + precision, cutlass::layout::ColumnMajor, // + precision, cutlass::layout::ColumnMajor, // + precision, cutlass::layout::RowMajor, // + precision, OpClass, SmArch>; + + // setup bench harness + cuasr::bench::device::BenchHarness bench({ N, N, N }); + + // benchmark loop + for (auto _ : state) { + benchmark::DoNotOptimize(bench.run()); + cudaDeviceSynchronize(); + } + + double flops_per_itr = 2.0 * N * N * N; + state.counters["Flop/s"] + = benchmark::Counter(flops_per_itr, benchmark::Counter::kIsIterationInvariantRate); +} +BENCHMARK(BM_SM80_device_minimum_plus_ssrgemm_nn_t) + ->RangeMultiplier(2)->Range(256, 4096); + +/////////////////////////////////////////////////////////////////////////////// + +static void BM_SM80_device_maximum_plus_dsrgemm_tt_n(benchmark::State &state) { + const auto N = static_cast(state.range(0)); + using precision = double; + using OpClass = cutlass::arch::OpClassSimt; + using SmArch = cutlass::arch::Sm80; + + using AddOp = cuasr::maximum; + using MultOp = cuasr::plus; + + using Srgemm = cuasr::gemm::device::Srgemm< // + AddOp, MultOp, // + precision, 
cutlass::layout::RowMajor, // + precision, cutlass::layout::RowMajor, // + precision, cutlass::layout::ColumnMajor, // + precision, OpClass, SmArch>; + + // setup bench harness + cuasr::bench::device::BenchHarness bench({ N, N, N }); + + // benchmark loop + for (auto _ : state) { + benchmark::DoNotOptimize(bench.run()); + cudaDeviceSynchronize(); + } + + double flops_per_itr = 2.0 * N * N * N; + state.counters["Flop/s"] + = benchmark::Counter(flops_per_itr, benchmark::Counter::kIsIterationInvariantRate); +} +BENCHMARK(BM_SM80_device_maximum_plus_dsrgemm_tt_n) + ->RangeMultiplier(2)->Range(256, 4096); + +/////////////////////////////////////////////////////////////////////////////// + +static void BM_SM80_device_maximum_plus_dsrgemm_tt_t(benchmark::State &state) { + const auto N = static_cast(state.range(0)); + using precision = double; + using OpClass = cutlass::arch::OpClassSimt; + using SmArch = cutlass::arch::Sm80; + + using AddOp = cuasr::maximum; + using MultOp = cuasr::plus; + + using Srgemm = cuasr::gemm::device::Srgemm< // + AddOp, MultOp, // + precision, cutlass::layout::RowMajor, // + precision, cutlass::layout::RowMajor, // + precision, cutlass::layout::RowMajor, // + precision, OpClass, SmArch>; + + // setup bench harness + cuasr::bench::device::BenchHarness bench({ N, N, N }); + + // benchmark loop + for (auto _ : state) { + benchmark::DoNotOptimize(bench.run()); + cudaDeviceSynchronize(); + } + + double flops_per_itr = 2.0 * N * N * N; + state.counters["Flop/s"] + = benchmark::Counter(flops_per_itr, benchmark::Counter::kIsIterationInvariantRate); +} +BENCHMARK(BM_SM80_device_maximum_plus_dsrgemm_tt_t) + ->RangeMultiplier(2)->Range(256, 4096); + +/////////////////////////////////////////////////////////////////////////////// + +static void BM_SM80_device_maximum_plus_dsrgemm_tn_n(benchmark::State &state) { + const auto N = static_cast(state.range(0)); + using precision = double; + using OpClass = cutlass::arch::OpClassSimt; + using SmArch = 
cutlass::arch::Sm80; + + using AddOp = cuasr::maximum; + using MultOp = cuasr::plus; + + using Srgemm = cuasr::gemm::device::Srgemm< // + AddOp, MultOp, // + precision, cutlass::layout::RowMajor, // + precision, cutlass::layout::ColumnMajor, // + precision, cutlass::layout::ColumnMajor, // + precision, OpClass, SmArch>; + + // setup bench harness + cuasr::bench::device::BenchHarness bench({ N, N, N }); + + // benchmark loop + for (auto _ : state) { + benchmark::DoNotOptimize(bench.run()); + cudaDeviceSynchronize(); + } + + double flops_per_itr = 2.0 * N * N * N; + state.counters["Flop/s"] + = benchmark::Counter(flops_per_itr, benchmark::Counter::kIsIterationInvariantRate); +} +BENCHMARK(BM_SM80_device_maximum_plus_dsrgemm_tn_n) + ->RangeMultiplier(2)->Range(256, 4096); + +/////////////////////////////////////////////////////////////////////////////// + +static void BM_SM80_device_maximum_plus_dsrgemm_tn_t(benchmark::State &state) { + const auto N = static_cast(state.range(0)); + using precision = double; + using OpClass = cutlass::arch::OpClassSimt; + using SmArch = cutlass::arch::Sm80; + + using AddOp = cuasr::maximum; + using MultOp = cuasr::plus; + + using Srgemm = cuasr::gemm::device::Srgemm< // + AddOp, MultOp, // + precision, cutlass::layout::RowMajor, // + precision, cutlass::layout::ColumnMajor, // + precision, cutlass::layout::RowMajor, // + precision, OpClass, SmArch>; + + // setup bench harness + cuasr::bench::device::BenchHarness bench({ N, N, N }); + + // benchmark loop + for (auto _ : state) { + benchmark::DoNotOptimize(bench.run()); + cudaDeviceSynchronize(); + } + + double flops_per_itr = 2.0 * N * N * N; + state.counters["Flop/s"] + = benchmark::Counter(flops_per_itr, benchmark::Counter::kIsIterationInvariantRate); +} +BENCHMARK(BM_SM80_device_maximum_plus_dsrgemm_tn_t) + ->RangeMultiplier(2)->Range(256, 4096); + +/////////////////////////////////////////////////////////////////////////////// + +static void 
BM_SM80_device_maximum_plus_dsrgemm_nt_n(benchmark::State &state) { + const auto N = static_cast(state.range(0)); + using precision = double; + using OpClass = cutlass::arch::OpClassSimt; + using SmArch = cutlass::arch::Sm80; + + using AddOp = cuasr::maximum; + using MultOp = cuasr::plus; + + using Srgemm = cuasr::gemm::device::Srgemm< // + AddOp, MultOp, // + precision, cutlass::layout::ColumnMajor, // + precision, cutlass::layout::RowMajor, // + precision, cutlass::layout::ColumnMajor, // + precision, OpClass, SmArch>; + + // setup bench harness + cuasr::bench::device::BenchHarness bench({ N, N, N }); + + // benchmark loop + for (auto _ : state) { + benchmark::DoNotOptimize(bench.run()); + cudaDeviceSynchronize(); + } + + double flops_per_itr = 2.0 * N * N * N; + state.counters["Flop/s"] + = benchmark::Counter(flops_per_itr, benchmark::Counter::kIsIterationInvariantRate); +} +BENCHMARK(BM_SM80_device_maximum_plus_dsrgemm_nt_n) + ->RangeMultiplier(2)->Range(256, 4096); + +/////////////////////////////////////////////////////////////////////////////// + +static void BM_SM80_device_maximum_plus_dsrgemm_nt_t(benchmark::State &state) { + const auto N = static_cast(state.range(0)); + using precision = double; + using OpClass = cutlass::arch::OpClassSimt; + using SmArch = cutlass::arch::Sm80; + + using AddOp = cuasr::maximum; + using MultOp = cuasr::plus; + + using Srgemm = cuasr::gemm::device::Srgemm< // + AddOp, MultOp, // + precision, cutlass::layout::ColumnMajor, // + precision, cutlass::layout::RowMajor, // + precision, cutlass::layout::RowMajor, // + precision, OpClass, SmArch>; + + // setup bench harness + cuasr::bench::device::BenchHarness bench({ N, N, N }); + + // benchmark loop + for (auto _ : state) { + benchmark::DoNotOptimize(bench.run()); + cudaDeviceSynchronize(); + } + + double flops_per_itr = 2.0 * N * N * N; + state.counters["Flop/s"] + = benchmark::Counter(flops_per_itr, benchmark::Counter::kIsIterationInvariantRate); +} 
+BENCHMARK(BM_SM80_device_maximum_plus_dsrgemm_nt_t) + ->RangeMultiplier(2)->Range(256, 4096); + +/////////////////////////////////////////////////////////////////////////////// + +static void BM_SM80_device_maximum_plus_dsrgemm_nn_n(benchmark::State &state) { + const auto N = static_cast(state.range(0)); + using precision = double; + using OpClass = cutlass::arch::OpClassSimt; + using SmArch = cutlass::arch::Sm80; + + using AddOp = cuasr::maximum; + using MultOp = cuasr::plus; + + using Srgemm = cuasr::gemm::device::Srgemm< // + AddOp, MultOp, // + precision, cutlass::layout::ColumnMajor, // + precision, cutlass::layout::ColumnMajor, // + precision, cutlass::layout::ColumnMajor, // + precision, OpClass, SmArch>; + + // setup bench harness + cuasr::bench::device::BenchHarness bench({ N, N, N }); + + // benchmark loop + for (auto _ : state) { + benchmark::DoNotOptimize(bench.run()); + cudaDeviceSynchronize(); + } + + double flops_per_itr = 2.0 * N * N * N; + state.counters["Flop/s"] + = benchmark::Counter(flops_per_itr, benchmark::Counter::kIsIterationInvariantRate); +} +BENCHMARK(BM_SM80_device_maximum_plus_dsrgemm_nn_n) + ->RangeMultiplier(2)->Range(256, 4096); + +/////////////////////////////////////////////////////////////////////////////// + +static void BM_SM80_device_maximum_plus_dsrgemm_nn_t(benchmark::State &state) { + const auto N = static_cast(state.range(0)); + using precision = double; + using OpClass = cutlass::arch::OpClassSimt; + using SmArch = cutlass::arch::Sm80; + + using AddOp = cuasr::maximum; + using MultOp = cuasr::plus; + + using Srgemm = cuasr::gemm::device::Srgemm< // + AddOp, MultOp, // + precision, cutlass::layout::ColumnMajor, // + precision, cutlass::layout::ColumnMajor, // + precision, cutlass::layout::RowMajor, // + precision, OpClass, SmArch>; + + // setup bench harness + cuasr::bench::device::BenchHarness bench({ N, N, N }); + + // benchmark loop + for (auto _ : state) { + benchmark::DoNotOptimize(bench.run()); + 
cudaDeviceSynchronize(); + } + + double flops_per_itr = 2.0 * N * N * N; + state.counters["Flop/s"] + = benchmark::Counter(flops_per_itr, benchmark::Counter::kIsIterationInvariantRate); +} +BENCHMARK(BM_SM80_device_maximum_plus_dsrgemm_nn_t) + ->RangeMultiplier(2)->Range(256, 4096); + +/////////////////////////////////////////////////////////////////////////////// + +static void BM_SM80_device_maximum_plus_ssrgemm_tt_n(benchmark::State &state) { + const auto N = static_cast(state.range(0)); + using precision = float; + using OpClass = cutlass::arch::OpClassSimt; + using SmArch = cutlass::arch::Sm80; + + using AddOp = cuasr::maximum; + using MultOp = cuasr::plus; + + using Srgemm = cuasr::gemm::device::Srgemm< // + AddOp, MultOp, // + precision, cutlass::layout::RowMajor, // + precision, cutlass::layout::RowMajor, // + precision, cutlass::layout::ColumnMajor, // + precision, OpClass, SmArch>; + + // setup bench harness + cuasr::bench::device::BenchHarness bench({ N, N, N }); + + // benchmark loop + for (auto _ : state) { + benchmark::DoNotOptimize(bench.run()); + cudaDeviceSynchronize(); + } + + double flops_per_itr = 2.0 * N * N * N; + state.counters["Flop/s"] + = benchmark::Counter(flops_per_itr, benchmark::Counter::kIsIterationInvariantRate); +} +BENCHMARK(BM_SM80_device_maximum_plus_ssrgemm_tt_n) + ->RangeMultiplier(2)->Range(256, 4096); + +/////////////////////////////////////////////////////////////////////////////// + +static void BM_SM80_device_maximum_plus_ssrgemm_tt_t(benchmark::State &state) { + const auto N = static_cast(state.range(0)); + using precision = float; + using OpClass = cutlass::arch::OpClassSimt; + using SmArch = cutlass::arch::Sm80; + + using AddOp = cuasr::maximum; + using MultOp = cuasr::plus; + + using Srgemm = cuasr::gemm::device::Srgemm< // + AddOp, MultOp, // + precision, cutlass::layout::RowMajor, // + precision, cutlass::layout::RowMajor, // + precision, cutlass::layout::RowMajor, // + precision, OpClass, SmArch>; + + // setup bench 
harness + cuasr::bench::device::BenchHarness bench({ N, N, N }); + + // benchmark loop + for (auto _ : state) { + benchmark::DoNotOptimize(bench.run()); + cudaDeviceSynchronize(); + } + + double flops_per_itr = 2.0 * N * N * N; + state.counters["Flop/s"] + = benchmark::Counter(flops_per_itr, benchmark::Counter::kIsIterationInvariantRate); +} +BENCHMARK(BM_SM80_device_maximum_plus_ssrgemm_tt_t) + ->RangeMultiplier(2)->Range(256, 4096); + +/////////////////////////////////////////////////////////////////////////////// + +static void BM_SM80_device_maximum_plus_ssrgemm_tn_n(benchmark::State &state) { + const auto N = static_cast(state.range(0)); + using precision = float; + using OpClass = cutlass::arch::OpClassSimt; + using SmArch = cutlass::arch::Sm80; + + using AddOp = cuasr::maximum; + using MultOp = cuasr::plus; + + using Srgemm = cuasr::gemm::device::Srgemm< // + AddOp, MultOp, // + precision, cutlass::layout::RowMajor, // + precision, cutlass::layout::ColumnMajor, // + precision, cutlass::layout::ColumnMajor, // + precision, OpClass, SmArch>; + + // setup bench harness + cuasr::bench::device::BenchHarness bench({ N, N, N }); + + // benchmark loop + for (auto _ : state) { + benchmark::DoNotOptimize(bench.run()); + cudaDeviceSynchronize(); + } + + double flops_per_itr = 2.0 * N * N * N; + state.counters["Flop/s"] + = benchmark::Counter(flops_per_itr, benchmark::Counter::kIsIterationInvariantRate); +} +BENCHMARK(BM_SM80_device_maximum_plus_ssrgemm_tn_n) + ->RangeMultiplier(2)->Range(256, 4096); + +/////////////////////////////////////////////////////////////////////////////// + +static void BM_SM80_device_maximum_plus_ssrgemm_tn_t(benchmark::State &state) { + const auto N = static_cast(state.range(0)); + using precision = float; + using OpClass = cutlass::arch::OpClassSimt; + using SmArch = cutlass::arch::Sm80; + + using AddOp = cuasr::maximum; + using MultOp = cuasr::plus; + + using Srgemm = cuasr::gemm::device::Srgemm< // + AddOp, MultOp, // + precision, 
cutlass::layout::RowMajor, // + precision, cutlass::layout::ColumnMajor, // + precision, cutlass::layout::RowMajor, // + precision, OpClass, SmArch>; + + // setup bench harness + cuasr::bench::device::BenchHarness bench({ N, N, N }); + + // benchmark loop + for (auto _ : state) { + benchmark::DoNotOptimize(bench.run()); + cudaDeviceSynchronize(); + } + + double flops_per_itr = 2.0 * N * N * N; + state.counters["Flop/s"] + = benchmark::Counter(flops_per_itr, benchmark::Counter::kIsIterationInvariantRate); +} +BENCHMARK(BM_SM80_device_maximum_plus_ssrgemm_tn_t) + ->RangeMultiplier(2)->Range(256, 4096); + +/////////////////////////////////////////////////////////////////////////////// + +static void BM_SM80_device_maximum_plus_ssrgemm_nt_n(benchmark::State &state) { + const auto N = static_cast(state.range(0)); + using precision = float; + using OpClass = cutlass::arch::OpClassSimt; + using SmArch = cutlass::arch::Sm80; + + using AddOp = cuasr::maximum; + using MultOp = cuasr::plus; + + using Srgemm = cuasr::gemm::device::Srgemm< // + AddOp, MultOp, // + precision, cutlass::layout::ColumnMajor, // + precision, cutlass::layout::RowMajor, // + precision, cutlass::layout::ColumnMajor, // + precision, OpClass, SmArch>; + + // setup bench harness + cuasr::bench::device::BenchHarness bench({ N, N, N }); + + // benchmark loop + for (auto _ : state) { + benchmark::DoNotOptimize(bench.run()); + cudaDeviceSynchronize(); + } + + double flops_per_itr = 2.0 * N * N * N; + state.counters["Flop/s"] + = benchmark::Counter(flops_per_itr, benchmark::Counter::kIsIterationInvariantRate); +} +BENCHMARK(BM_SM80_device_maximum_plus_ssrgemm_nt_n) + ->RangeMultiplier(2)->Range(256, 4096); + +/////////////////////////////////////////////////////////////////////////////// + +static void BM_SM80_device_maximum_plus_ssrgemm_nt_t(benchmark::State &state) { + const auto N = static_cast(state.range(0)); + using precision = float; + using OpClass = cutlass::arch::OpClassSimt; + using SmArch = 
cutlass::arch::Sm80; + + using AddOp = cuasr::maximum; + using MultOp = cuasr::plus; + + using Srgemm = cuasr::gemm::device::Srgemm< // + AddOp, MultOp, // + precision, cutlass::layout::ColumnMajor, // + precision, cutlass::layout::RowMajor, // + precision, cutlass::layout::RowMajor, // + precision, OpClass, SmArch>; + + // setup bench harness + cuasr::bench::device::BenchHarness bench({ N, N, N }); + + // benchmark loop + for (auto _ : state) { + benchmark::DoNotOptimize(bench.run()); + cudaDeviceSynchronize(); + } + + double flops_per_itr = 2.0 * N * N * N; + state.counters["Flop/s"] + = benchmark::Counter(flops_per_itr, benchmark::Counter::kIsIterationInvariantRate); +} +BENCHMARK(BM_SM80_device_maximum_plus_ssrgemm_nt_t) + ->RangeMultiplier(2)->Range(256, 4096); + +/////////////////////////////////////////////////////////////////////////////// + +static void BM_SM80_device_maximum_plus_ssrgemm_nn_n(benchmark::State &state) { + const auto N = static_cast(state.range(0)); + using precision = float; + using OpClass = cutlass::arch::OpClassSimt; + using SmArch = cutlass::arch::Sm80; + + using AddOp = cuasr::maximum; + using MultOp = cuasr::plus; + + using Srgemm = cuasr::gemm::device::Srgemm< // + AddOp, MultOp, // + precision, cutlass::layout::ColumnMajor, // + precision, cutlass::layout::ColumnMajor, // + precision, cutlass::layout::ColumnMajor, // + precision, OpClass, SmArch>; + + // setup bench harness + cuasr::bench::device::BenchHarness bench({ N, N, N }); + + // benchmark loop + for (auto _ : state) { + benchmark::DoNotOptimize(bench.run()); + cudaDeviceSynchronize(); + } + + double flops_per_itr = 2.0 * N * N * N; + state.counters["Flop/s"] + = benchmark::Counter(flops_per_itr, benchmark::Counter::kIsIterationInvariantRate); +} +BENCHMARK(BM_SM80_device_maximum_plus_ssrgemm_nn_n) + ->RangeMultiplier(2)->Range(256, 4096); + +/////////////////////////////////////////////////////////////////////////////// + +static void 
BM_SM80_device_maximum_plus_ssrgemm_nn_t(benchmark::State &state) { + const auto N = static_cast(state.range(0)); + using precision = float; + using OpClass = cutlass::arch::OpClassSimt; + using SmArch = cutlass::arch::Sm80; + + using AddOp = cuasr::maximum; + using MultOp = cuasr::plus; + + using Srgemm = cuasr::gemm::device::Srgemm< // + AddOp, MultOp, // + precision, cutlass::layout::ColumnMajor, // + precision, cutlass::layout::ColumnMajor, // + precision, cutlass::layout::RowMajor, // + precision, OpClass, SmArch>; + + // setup bench harness + cuasr::bench::device::BenchHarness bench({ N, N, N }); + + // benchmark loop + for (auto _ : state) { + benchmark::DoNotOptimize(bench.run()); + cudaDeviceSynchronize(); + } + + double flops_per_itr = 2.0 * N * N * N; + state.counters["Flop/s"] + = benchmark::Counter(flops_per_itr, benchmark::Counter::kIsIterationInvariantRate); +} +BENCHMARK(BM_SM80_device_maximum_plus_ssrgemm_nn_t) + ->RangeMultiplier(2)->Range(256, 4096); + +/////////////////////////////////////////////////////////////////////////////// + +static void BM_SM80_device_minimum_maximum_dsrgemm_tt_n(benchmark::State &state) { + const auto N = static_cast(state.range(0)); + using precision = double; + using OpClass = cutlass::arch::OpClassSimt; + using SmArch = cutlass::arch::Sm80; + + using AddOp = cuasr::minimum; + using MultOp = cuasr::maximum; + + using Srgemm = cuasr::gemm::device::Srgemm< // + AddOp, MultOp, // + precision, cutlass::layout::RowMajor, // + precision, cutlass::layout::RowMajor, // + precision, cutlass::layout::ColumnMajor, // + precision, OpClass, SmArch>; + + // setup bench harness + cuasr::bench::device::BenchHarness bench({ N, N, N }); + + // benchmark loop + for (auto _ : state) { + benchmark::DoNotOptimize(bench.run()); + cudaDeviceSynchronize(); + } + + double flops_per_itr = 2.0 * N * N * N; + state.counters["Flop/s"] + = benchmark::Counter(flops_per_itr, benchmark::Counter::kIsIterationInvariantRate); +} 
+BENCHMARK(BM_SM80_device_minimum_maximum_dsrgemm_tt_n) + ->RangeMultiplier(2)->Range(256, 4096); + +/////////////////////////////////////////////////////////////////////////////// + +static void BM_SM80_device_minimum_maximum_dsrgemm_tt_t(benchmark::State &state) { + const auto N = static_cast(state.range(0)); + using precision = double; + using OpClass = cutlass::arch::OpClassSimt; + using SmArch = cutlass::arch::Sm80; + + using AddOp = cuasr::minimum; + using MultOp = cuasr::maximum; + + using Srgemm = cuasr::gemm::device::Srgemm< // + AddOp, MultOp, // + precision, cutlass::layout::RowMajor, // + precision, cutlass::layout::RowMajor, // + precision, cutlass::layout::RowMajor, // + precision, OpClass, SmArch>; + + // setup bench harness + cuasr::bench::device::BenchHarness bench({ N, N, N }); + + // benchmark loop + for (auto _ : state) { + benchmark::DoNotOptimize(bench.run()); + cudaDeviceSynchronize(); + } + + double flops_per_itr = 2.0 * N * N * N; + state.counters["Flop/s"] + = benchmark::Counter(flops_per_itr, benchmark::Counter::kIsIterationInvariantRate); +} +BENCHMARK(BM_SM80_device_minimum_maximum_dsrgemm_tt_t) + ->RangeMultiplier(2)->Range(256, 4096); + +/////////////////////////////////////////////////////////////////////////////// + +static void BM_SM80_device_minimum_maximum_dsrgemm_tn_n(benchmark::State &state) { + const auto N = static_cast(state.range(0)); + using precision = double; + using OpClass = cutlass::arch::OpClassSimt; + using SmArch = cutlass::arch::Sm80; + + using AddOp = cuasr::minimum; + using MultOp = cuasr::maximum; + + using Srgemm = cuasr::gemm::device::Srgemm< // + AddOp, MultOp, // + precision, cutlass::layout::RowMajor, // + precision, cutlass::layout::ColumnMajor, // + precision, cutlass::layout::ColumnMajor, // + precision, OpClass, SmArch>; + + // setup bench harness + cuasr::bench::device::BenchHarness bench({ N, N, N }); + + // benchmark loop + for (auto _ : state) { + benchmark::DoNotOptimize(bench.run()); + 
cudaDeviceSynchronize(); + } + + double flops_per_itr = 2.0 * N * N * N; + state.counters["Flop/s"] + = benchmark::Counter(flops_per_itr, benchmark::Counter::kIsIterationInvariantRate); +} +BENCHMARK(BM_SM80_device_minimum_maximum_dsrgemm_tn_n) + ->RangeMultiplier(2)->Range(256, 4096); + +/////////////////////////////////////////////////////////////////////////////// + +static void BM_SM80_device_minimum_maximum_dsrgemm_tn_t(benchmark::State &state) { + const auto N = static_cast(state.range(0)); + using precision = double; + using OpClass = cutlass::arch::OpClassSimt; + using SmArch = cutlass::arch::Sm80; + + using AddOp = cuasr::minimum; + using MultOp = cuasr::maximum; + + using Srgemm = cuasr::gemm::device::Srgemm< // + AddOp, MultOp, // + precision, cutlass::layout::RowMajor, // + precision, cutlass::layout::ColumnMajor, // + precision, cutlass::layout::RowMajor, // + precision, OpClass, SmArch>; + + // setup bench harness + cuasr::bench::device::BenchHarness bench({ N, N, N }); + + // benchmark loop + for (auto _ : state) { + benchmark::DoNotOptimize(bench.run()); + cudaDeviceSynchronize(); + } + + double flops_per_itr = 2.0 * N * N * N; + state.counters["Flop/s"] + = benchmark::Counter(flops_per_itr, benchmark::Counter::kIsIterationInvariantRate); +} +BENCHMARK(BM_SM80_device_minimum_maximum_dsrgemm_tn_t) + ->RangeMultiplier(2)->Range(256, 4096); + +/////////////////////////////////////////////////////////////////////////////// + +static void BM_SM80_device_minimum_maximum_dsrgemm_nt_n(benchmark::State &state) { + const auto N = static_cast(state.range(0)); + using precision = double; + using OpClass = cutlass::arch::OpClassSimt; + using SmArch = cutlass::arch::Sm80; + + using AddOp = cuasr::minimum; + using MultOp = cuasr::maximum; + + using Srgemm = cuasr::gemm::device::Srgemm< // + AddOp, MultOp, // + precision, cutlass::layout::ColumnMajor, // + precision, cutlass::layout::RowMajor, // + precision, cutlass::layout::ColumnMajor, // + precision, OpClass, 
SmArch>; + + // setup bench harness + cuasr::bench::device::BenchHarness bench({ N, N, N }); + + // benchmark loop + for (auto _ : state) { + benchmark::DoNotOptimize(bench.run()); + cudaDeviceSynchronize(); + } + + double flops_per_itr = 2.0 * N * N * N; + state.counters["Flop/s"] + = benchmark::Counter(flops_per_itr, benchmark::Counter::kIsIterationInvariantRate); +} +BENCHMARK(BM_SM80_device_minimum_maximum_dsrgemm_nt_n) + ->RangeMultiplier(2)->Range(256, 4096); + +/////////////////////////////////////////////////////////////////////////////// + +static void BM_SM80_device_minimum_maximum_dsrgemm_nt_t(benchmark::State &state) { + const auto N = static_cast(state.range(0)); + using precision = double; + using OpClass = cutlass::arch::OpClassSimt; + using SmArch = cutlass::arch::Sm80; + + using AddOp = cuasr::minimum; + using MultOp = cuasr::maximum; + + using Srgemm = cuasr::gemm::device::Srgemm< // + AddOp, MultOp, // + precision, cutlass::layout::ColumnMajor, // + precision, cutlass::layout::RowMajor, // + precision, cutlass::layout::RowMajor, // + precision, OpClass, SmArch>; + + // setup bench harness + cuasr::bench::device::BenchHarness bench({ N, N, N }); + + // benchmark loop + for (auto _ : state) { + benchmark::DoNotOptimize(bench.run()); + cudaDeviceSynchronize(); + } + + double flops_per_itr = 2.0 * N * N * N; + state.counters["Flop/s"] + = benchmark::Counter(flops_per_itr, benchmark::Counter::kIsIterationInvariantRate); +} +BENCHMARK(BM_SM80_device_minimum_maximum_dsrgemm_nt_t) + ->RangeMultiplier(2)->Range(256, 4096); + +/////////////////////////////////////////////////////////////////////////////// + +static void BM_SM80_device_minimum_maximum_dsrgemm_nn_n(benchmark::State &state) { + const auto N = static_cast(state.range(0)); + using precision = double; + using OpClass = cutlass::arch::OpClassSimt; + using SmArch = cutlass::arch::Sm80; + + using AddOp = cuasr::minimum; + using MultOp = cuasr::maximum; + + using Srgemm = 
cuasr::gemm::device::Srgemm< // + AddOp, MultOp, // + precision, cutlass::layout::ColumnMajor, // + precision, cutlass::layout::ColumnMajor, // + precision, cutlass::layout::ColumnMajor, // + precision, OpClass, SmArch>; + + // setup bench harness + cuasr::bench::device::BenchHarness bench({ N, N, N }); + + // benchmark loop + for (auto _ : state) { + benchmark::DoNotOptimize(bench.run()); + cudaDeviceSynchronize(); + } + + double flops_per_itr = 2.0 * N * N * N; + state.counters["Flop/s"] + = benchmark::Counter(flops_per_itr, benchmark::Counter::kIsIterationInvariantRate); +} +BENCHMARK(BM_SM80_device_minimum_maximum_dsrgemm_nn_n) + ->RangeMultiplier(2)->Range(256, 4096); + +/////////////////////////////////////////////////////////////////////////////// + +static void BM_SM80_device_minimum_maximum_dsrgemm_nn_t(benchmark::State &state) { + const auto N = static_cast(state.range(0)); + using precision = double; + using OpClass = cutlass::arch::OpClassSimt; + using SmArch = cutlass::arch::Sm80; + + using AddOp = cuasr::minimum; + using MultOp = cuasr::maximum; + + using Srgemm = cuasr::gemm::device::Srgemm< // + AddOp, MultOp, // + precision, cutlass::layout::ColumnMajor, // + precision, cutlass::layout::ColumnMajor, // + precision, cutlass::layout::RowMajor, // + precision, OpClass, SmArch>; + + // setup bench harness + cuasr::bench::device::BenchHarness bench({ N, N, N }); + + // benchmark loop + for (auto _ : state) { + benchmark::DoNotOptimize(bench.run()); + cudaDeviceSynchronize(); + } + + double flops_per_itr = 2.0 * N * N * N; + state.counters["Flop/s"] + = benchmark::Counter(flops_per_itr, benchmark::Counter::kIsIterationInvariantRate); +} +BENCHMARK(BM_SM80_device_minimum_maximum_dsrgemm_nn_t) + ->RangeMultiplier(2)->Range(256, 4096); + +/////////////////////////////////////////////////////////////////////////////// + +static void BM_SM80_device_minimum_maximum_ssrgemm_tt_n(benchmark::State &state) { + const auto N = static_cast(state.range(0)); + using 
precision = float; + using OpClass = cutlass::arch::OpClassSimt; + using SmArch = cutlass::arch::Sm80; + + using AddOp = cuasr::minimum; + using MultOp = cuasr::maximum; + + using Srgemm = cuasr::gemm::device::Srgemm< // + AddOp, MultOp, // + precision, cutlass::layout::RowMajor, // + precision, cutlass::layout::RowMajor, // + precision, cutlass::layout::ColumnMajor, // + precision, OpClass, SmArch>; + + // setup bench harness + cuasr::bench::device::BenchHarness bench({ N, N, N }); + + // benchmark loop + for (auto _ : state) { + benchmark::DoNotOptimize(bench.run()); + cudaDeviceSynchronize(); + } + + double flops_per_itr = 2.0 * N * N * N; + state.counters["Flop/s"] + = benchmark::Counter(flops_per_itr, benchmark::Counter::kIsIterationInvariantRate); +} +BENCHMARK(BM_SM80_device_minimum_maximum_ssrgemm_tt_n) + ->RangeMultiplier(2)->Range(256, 4096); + +/////////////////////////////////////////////////////////////////////////////// + +static void BM_SM80_device_minimum_maximum_ssrgemm_tt_t(benchmark::State &state) { + const auto N = static_cast(state.range(0)); + using precision = float; + using OpClass = cutlass::arch::OpClassSimt; + using SmArch = cutlass::arch::Sm80; + + using AddOp = cuasr::minimum; + using MultOp = cuasr::maximum; + + using Srgemm = cuasr::gemm::device::Srgemm< // + AddOp, MultOp, // + precision, cutlass::layout::RowMajor, // + precision, cutlass::layout::RowMajor, // + precision, cutlass::layout::RowMajor, // + precision, OpClass, SmArch>; + + // setup bench harness + cuasr::bench::device::BenchHarness bench({ N, N, N }); + + // benchmark loop + for (auto _ : state) { + benchmark::DoNotOptimize(bench.run()); + cudaDeviceSynchronize(); + } + + double flops_per_itr = 2.0 * N * N * N; + state.counters["Flop/s"] + = benchmark::Counter(flops_per_itr, benchmark::Counter::kIsIterationInvariantRate); +} +BENCHMARK(BM_SM80_device_minimum_maximum_ssrgemm_tt_t) + ->RangeMultiplier(2)->Range(256, 4096); + 
+/////////////////////////////////////////////////////////////////////////////// + +static void BM_SM80_device_minimum_maximum_ssrgemm_tn_n(benchmark::State &state) { + const auto N = static_cast(state.range(0)); + using precision = float; + using OpClass = cutlass::arch::OpClassSimt; + using SmArch = cutlass::arch::Sm80; + + using AddOp = cuasr::minimum; + using MultOp = cuasr::maximum; + + using Srgemm = cuasr::gemm::device::Srgemm< // + AddOp, MultOp, // + precision, cutlass::layout::RowMajor, // + precision, cutlass::layout::ColumnMajor, // + precision, cutlass::layout::ColumnMajor, // + precision, OpClass, SmArch>; + + // setup bench harness + cuasr::bench::device::BenchHarness bench({ N, N, N }); + + // benchmark loop + for (auto _ : state) { + benchmark::DoNotOptimize(bench.run()); + cudaDeviceSynchronize(); + } + + double flops_per_itr = 2.0 * N * N * N; + state.counters["Flop/s"] + = benchmark::Counter(flops_per_itr, benchmark::Counter::kIsIterationInvariantRate); +} +BENCHMARK(BM_SM80_device_minimum_maximum_ssrgemm_tn_n) + ->RangeMultiplier(2)->Range(256, 4096); + +/////////////////////////////////////////////////////////////////////////////// + +static void BM_SM80_device_minimum_maximum_ssrgemm_tn_t(benchmark::State &state) { + const auto N = static_cast(state.range(0)); + using precision = float; + using OpClass = cutlass::arch::OpClassSimt; + using SmArch = cutlass::arch::Sm80; + + using AddOp = cuasr::minimum; + using MultOp = cuasr::maximum; + + using Srgemm = cuasr::gemm::device::Srgemm< // + AddOp, MultOp, // + precision, cutlass::layout::RowMajor, // + precision, cutlass::layout::ColumnMajor, // + precision, cutlass::layout::RowMajor, // + precision, OpClass, SmArch>; + + // setup bench harness + cuasr::bench::device::BenchHarness bench({ N, N, N }); + + // benchmark loop + for (auto _ : state) { + benchmark::DoNotOptimize(bench.run()); + cudaDeviceSynchronize(); + } + + double flops_per_itr = 2.0 * N * N * N; + state.counters["Flop/s"] + = 
benchmark::Counter(flops_per_itr, benchmark::Counter::kIsIterationInvariantRate); +} +BENCHMARK(BM_SM80_device_minimum_maximum_ssrgemm_tn_t) + ->RangeMultiplier(2)->Range(256, 4096); + +/////////////////////////////////////////////////////////////////////////////// + +static void BM_SM80_device_minimum_maximum_ssrgemm_nt_n(benchmark::State &state) { + const auto N = static_cast(state.range(0)); + using precision = float; + using OpClass = cutlass::arch::OpClassSimt; + using SmArch = cutlass::arch::Sm80; + + using AddOp = cuasr::minimum; + using MultOp = cuasr::maximum; + + using Srgemm = cuasr::gemm::device::Srgemm< // + AddOp, MultOp, // + precision, cutlass::layout::ColumnMajor, // + precision, cutlass::layout::RowMajor, // + precision, cutlass::layout::ColumnMajor, // + precision, OpClass, SmArch>; + + // setup bench harness + cuasr::bench::device::BenchHarness bench({ N, N, N }); + + // benchmark loop + for (auto _ : state) { + benchmark::DoNotOptimize(bench.run()); + cudaDeviceSynchronize(); + } + + double flops_per_itr = 2.0 * N * N * N; + state.counters["Flop/s"] + = benchmark::Counter(flops_per_itr, benchmark::Counter::kIsIterationInvariantRate); +} +BENCHMARK(BM_SM80_device_minimum_maximum_ssrgemm_nt_n) + ->RangeMultiplier(2)->Range(256, 4096); + +/////////////////////////////////////////////////////////////////////////////// + +static void BM_SM80_device_minimum_maximum_ssrgemm_nt_t(benchmark::State &state) { + const auto N = static_cast(state.range(0)); + using precision = float; + using OpClass = cutlass::arch::OpClassSimt; + using SmArch = cutlass::arch::Sm80; + + using AddOp = cuasr::minimum; + using MultOp = cuasr::maximum; + + using Srgemm = cuasr::gemm::device::Srgemm< // + AddOp, MultOp, // + precision, cutlass::layout::ColumnMajor, // + precision, cutlass::layout::RowMajor, // + precision, cutlass::layout::RowMajor, // + precision, OpClass, SmArch>; + + // setup bench harness + cuasr::bench::device::BenchHarness bench({ N, N, N }); + + // 
benchmark loop + for (auto _ : state) { + benchmark::DoNotOptimize(bench.run()); + cudaDeviceSynchronize(); + } + + double flops_per_itr = 2.0 * N * N * N; + state.counters["Flop/s"] + = benchmark::Counter(flops_per_itr, benchmark::Counter::kIsIterationInvariantRate); +} +BENCHMARK(BM_SM80_device_minimum_maximum_ssrgemm_nt_t) + ->RangeMultiplier(2)->Range(256, 4096); + +/////////////////////////////////////////////////////////////////////////////// + +static void BM_SM80_device_minimum_maximum_ssrgemm_nn_n(benchmark::State &state) { + const auto N = static_cast(state.range(0)); + using precision = float; + using OpClass = cutlass::arch::OpClassSimt; + using SmArch = cutlass::arch::Sm80; + + using AddOp = cuasr::minimum; + using MultOp = cuasr::maximum; + + using Srgemm = cuasr::gemm::device::Srgemm< // + AddOp, MultOp, // + precision, cutlass::layout::ColumnMajor, // + precision, cutlass::layout::ColumnMajor, // + precision, cutlass::layout::ColumnMajor, // + precision, OpClass, SmArch>; + + // setup bench harness + cuasr::bench::device::BenchHarness bench({ N, N, N }); + + // benchmark loop + for (auto _ : state) { + benchmark::DoNotOptimize(bench.run()); + cudaDeviceSynchronize(); + } + + double flops_per_itr = 2.0 * N * N * N; + state.counters["Flop/s"] + = benchmark::Counter(flops_per_itr, benchmark::Counter::kIsIterationInvariantRate); +} +BENCHMARK(BM_SM80_device_minimum_maximum_ssrgemm_nn_n) + ->RangeMultiplier(2)->Range(256, 4096); + +/////////////////////////////////////////////////////////////////////////////// + +static void BM_SM80_device_minimum_maximum_ssrgemm_nn_t(benchmark::State &state) { + const auto N = static_cast(state.range(0)); + using precision = float; + using OpClass = cutlass::arch::OpClassSimt; + using SmArch = cutlass::arch::Sm80; + + using AddOp = cuasr::minimum; + using MultOp = cuasr::maximum; + + using Srgemm = cuasr::gemm::device::Srgemm< // + AddOp, MultOp, // + precision, cutlass::layout::ColumnMajor, // + precision, 
cutlass::layout::ColumnMajor, // + precision, cutlass::layout::RowMajor, // + precision, OpClass, SmArch>; + + // setup bench harness + cuasr::bench::device::BenchHarness bench({ N, N, N }); + + // benchmark loop + for (auto _ : state) { + benchmark::DoNotOptimize(bench.run()); + cudaDeviceSynchronize(); + } + + double flops_per_itr = 2.0 * N * N * N; + state.counters["Flop/s"] + = benchmark::Counter(flops_per_itr, benchmark::Counter::kIsIterationInvariantRate); +} +BENCHMARK(BM_SM80_device_minimum_maximum_ssrgemm_nn_t) + ->RangeMultiplier(2)->Range(256, 4096); + +/////////////////////////////////////////////////////////////////////////////// + +static void BM_SM80_device_maximum_minimum_dsrgemm_tt_n(benchmark::State &state) { + const auto N = static_cast(state.range(0)); + using precision = double; + using OpClass = cutlass::arch::OpClassSimt; + using SmArch = cutlass::arch::Sm80; + + using AddOp = cuasr::maximum; + using MultOp = cuasr::minimum; + + using Srgemm = cuasr::gemm::device::Srgemm< // + AddOp, MultOp, // + precision, cutlass::layout::RowMajor, // + precision, cutlass::layout::RowMajor, // + precision, cutlass::layout::ColumnMajor, // + precision, OpClass, SmArch>; + + // setup bench harness + cuasr::bench::device::BenchHarness bench({ N, N, N }); + + // benchmark loop + for (auto _ : state) { + benchmark::DoNotOptimize(bench.run()); + cudaDeviceSynchronize(); + } + + double flops_per_itr = 2.0 * N * N * N; + state.counters["Flop/s"] + = benchmark::Counter(flops_per_itr, benchmark::Counter::kIsIterationInvariantRate); +} +BENCHMARK(BM_SM80_device_maximum_minimum_dsrgemm_tt_n) + ->RangeMultiplier(2)->Range(256, 4096); + +/////////////////////////////////////////////////////////////////////////////// + +static void BM_SM80_device_maximum_minimum_dsrgemm_tt_t(benchmark::State &state) { + const auto N = static_cast(state.range(0)); + using precision = double; + using OpClass = cutlass::arch::OpClassSimt; + using SmArch = cutlass::arch::Sm80; + + using AddOp 
= cuasr::maximum; + using MultOp = cuasr::minimum; + + using Srgemm = cuasr::gemm::device::Srgemm< // + AddOp, MultOp, // + precision, cutlass::layout::RowMajor, // + precision, cutlass::layout::RowMajor, // + precision, cutlass::layout::RowMajor, // + precision, OpClass, SmArch>; + + // setup bench harness + cuasr::bench::device::BenchHarness bench({ N, N, N }); + + // benchmark loop + for (auto _ : state) { + benchmark::DoNotOptimize(bench.run()); + cudaDeviceSynchronize(); + } + + double flops_per_itr = 2.0 * N * N * N; + state.counters["Flop/s"] + = benchmark::Counter(flops_per_itr, benchmark::Counter::kIsIterationInvariantRate); +} +BENCHMARK(BM_SM80_device_maximum_minimum_dsrgemm_tt_t) + ->RangeMultiplier(2)->Range(256, 4096); + +/////////////////////////////////////////////////////////////////////////////// + +static void BM_SM80_device_maximum_minimum_dsrgemm_tn_n(benchmark::State &state) { + const auto N = static_cast(state.range(0)); + using precision = double; + using OpClass = cutlass::arch::OpClassSimt; + using SmArch = cutlass::arch::Sm80; + + using AddOp = cuasr::maximum; + using MultOp = cuasr::minimum; + + using Srgemm = cuasr::gemm::device::Srgemm< // + AddOp, MultOp, // + precision, cutlass::layout::RowMajor, // + precision, cutlass::layout::ColumnMajor, // + precision, cutlass::layout::ColumnMajor, // + precision, OpClass, SmArch>; + + // setup bench harness + cuasr::bench::device::BenchHarness bench({ N, N, N }); + + // benchmark loop + for (auto _ : state) { + benchmark::DoNotOptimize(bench.run()); + cudaDeviceSynchronize(); + } + + double flops_per_itr = 2.0 * N * N * N; + state.counters["Flop/s"] + = benchmark::Counter(flops_per_itr, benchmark::Counter::kIsIterationInvariantRate); +} +BENCHMARK(BM_SM80_device_maximum_minimum_dsrgemm_tn_n) + ->RangeMultiplier(2)->Range(256, 4096); + +/////////////////////////////////////////////////////////////////////////////// + +static void BM_SM80_device_maximum_minimum_dsrgemm_tn_t(benchmark::State 
&state) { + const auto N = static_cast(state.range(0)); + using precision = double; + using OpClass = cutlass::arch::OpClassSimt; + using SmArch = cutlass::arch::Sm80; + + using AddOp = cuasr::maximum; + using MultOp = cuasr::minimum; + + using Srgemm = cuasr::gemm::device::Srgemm< // + AddOp, MultOp, // + precision, cutlass::layout::RowMajor, // + precision, cutlass::layout::ColumnMajor, // + precision, cutlass::layout::RowMajor, // + precision, OpClass, SmArch>; + + // setup bench harness + cuasr::bench::device::BenchHarness bench({ N, N, N }); + + // benchmark loop + for (auto _ : state) { + benchmark::DoNotOptimize(bench.run()); + cudaDeviceSynchronize(); + } + + double flops_per_itr = 2.0 * N * N * N; + state.counters["Flop/s"] + = benchmark::Counter(flops_per_itr, benchmark::Counter::kIsIterationInvariantRate); +} +BENCHMARK(BM_SM80_device_maximum_minimum_dsrgemm_tn_t) + ->RangeMultiplier(2)->Range(256, 4096); + +/////////////////////////////////////////////////////////////////////////////// + +static void BM_SM80_device_maximum_minimum_dsrgemm_nt_n(benchmark::State &state) { + const auto N = static_cast(state.range(0)); + using precision = double; + using OpClass = cutlass::arch::OpClassSimt; + using SmArch = cutlass::arch::Sm80; + + using AddOp = cuasr::maximum; + using MultOp = cuasr::minimum; + + using Srgemm = cuasr::gemm::device::Srgemm< // + AddOp, MultOp, // + precision, cutlass::layout::ColumnMajor, // + precision, cutlass::layout::RowMajor, // + precision, cutlass::layout::ColumnMajor, // + precision, OpClass, SmArch>; + + // setup bench harness + cuasr::bench::device::BenchHarness bench({ N, N, N }); + + // benchmark loop + for (auto _ : state) { + benchmark::DoNotOptimize(bench.run()); + cudaDeviceSynchronize(); + } + + double flops_per_itr = 2.0 * N * N * N; + state.counters["Flop/s"] + = benchmark::Counter(flops_per_itr, benchmark::Counter::kIsIterationInvariantRate); +} +BENCHMARK(BM_SM80_device_maximum_minimum_dsrgemm_nt_n) + 
->RangeMultiplier(2)->Range(256, 4096); + +/////////////////////////////////////////////////////////////////////////////// + +static void BM_SM80_device_maximum_minimum_dsrgemm_nt_t(benchmark::State &state) { + const auto N = static_cast(state.range(0)); + using precision = double; + using OpClass = cutlass::arch::OpClassSimt; + using SmArch = cutlass::arch::Sm80; + + using AddOp = cuasr::maximum; + using MultOp = cuasr::minimum; + + using Srgemm = cuasr::gemm::device::Srgemm< // + AddOp, MultOp, // + precision, cutlass::layout::ColumnMajor, // + precision, cutlass::layout::RowMajor, // + precision, cutlass::layout::RowMajor, // + precision, OpClass, SmArch>; + + // setup bench harness + cuasr::bench::device::BenchHarness bench({ N, N, N }); + + // benchmark loop + for (auto _ : state) { + benchmark::DoNotOptimize(bench.run()); + cudaDeviceSynchronize(); + } + + double flops_per_itr = 2.0 * N * N * N; + state.counters["Flop/s"] + = benchmark::Counter(flops_per_itr, benchmark::Counter::kIsIterationInvariantRate); +} +BENCHMARK(BM_SM80_device_maximum_minimum_dsrgemm_nt_t) + ->RangeMultiplier(2)->Range(256, 4096); + +/////////////////////////////////////////////////////////////////////////////// + +static void BM_SM80_device_maximum_minimum_dsrgemm_nn_n(benchmark::State &state) { + const auto N = static_cast(state.range(0)); + using precision = double; + using OpClass = cutlass::arch::OpClassSimt; + using SmArch = cutlass::arch::Sm80; + + using AddOp = cuasr::maximum; + using MultOp = cuasr::minimum; + + using Srgemm = cuasr::gemm::device::Srgemm< // + AddOp, MultOp, // + precision, cutlass::layout::ColumnMajor, // + precision, cutlass::layout::ColumnMajor, // + precision, cutlass::layout::ColumnMajor, // + precision, OpClass, SmArch>; + + // setup bench harness + cuasr::bench::device::BenchHarness bench({ N, N, N }); + + // benchmark loop + for (auto _ : state) { + benchmark::DoNotOptimize(bench.run()); + cudaDeviceSynchronize(); + } + + double flops_per_itr = 2.0 * 
N * N * N; + state.counters["Flop/s"] + = benchmark::Counter(flops_per_itr, benchmark::Counter::kIsIterationInvariantRate); +} +BENCHMARK(BM_SM80_device_maximum_minimum_dsrgemm_nn_n) + ->RangeMultiplier(2)->Range(256, 4096); + +/////////////////////////////////////////////////////////////////////////////// + +static void BM_SM80_device_maximum_minimum_dsrgemm_nn_t(benchmark::State &state) { + const auto N = static_cast(state.range(0)); + using precision = double; + using OpClass = cutlass::arch::OpClassSimt; + using SmArch = cutlass::arch::Sm80; + + using AddOp = cuasr::maximum; + using MultOp = cuasr::minimum; + + using Srgemm = cuasr::gemm::device::Srgemm< // + AddOp, MultOp, // + precision, cutlass::layout::ColumnMajor, // + precision, cutlass::layout::ColumnMajor, // + precision, cutlass::layout::RowMajor, // + precision, OpClass, SmArch>; + + // setup bench harness + cuasr::bench::device::BenchHarness bench({ N, N, N }); + + // benchmark loop + for (auto _ : state) { + benchmark::DoNotOptimize(bench.run()); + cudaDeviceSynchronize(); + } + + double flops_per_itr = 2.0 * N * N * N; + state.counters["Flop/s"] + = benchmark::Counter(flops_per_itr, benchmark::Counter::kIsIterationInvariantRate); +} +BENCHMARK(BM_SM80_device_maximum_minimum_dsrgemm_nn_t) + ->RangeMultiplier(2)->Range(256, 4096); + +/////////////////////////////////////////////////////////////////////////////// + +static void BM_SM80_device_maximum_minimum_ssrgemm_tt_n(benchmark::State &state) { + const auto N = static_cast(state.range(0)); + using precision = float; + using OpClass = cutlass::arch::OpClassSimt; + using SmArch = cutlass::arch::Sm80; + + using AddOp = cuasr::maximum; + using MultOp = cuasr::minimum; + + using Srgemm = cuasr::gemm::device::Srgemm< // + AddOp, MultOp, // + precision, cutlass::layout::RowMajor, // + precision, cutlass::layout::RowMajor, // + precision, cutlass::layout::ColumnMajor, // + precision, OpClass, SmArch>; + + // setup bench harness + 
cuasr::bench::device::BenchHarness bench({ N, N, N }); + + // benchmark loop + for (auto _ : state) { + benchmark::DoNotOptimize(bench.run()); + cudaDeviceSynchronize(); + } + + double flops_per_itr = 2.0 * N * N * N; + state.counters["Flop/s"] + = benchmark::Counter(flops_per_itr, benchmark::Counter::kIsIterationInvariantRate); +} +BENCHMARK(BM_SM80_device_maximum_minimum_ssrgemm_tt_n) + ->RangeMultiplier(2)->Range(256, 4096); + +/////////////////////////////////////////////////////////////////////////////// + +static void BM_SM80_device_maximum_minimum_ssrgemm_tt_t(benchmark::State &state) { + const auto N = static_cast(state.range(0)); + using precision = float; + using OpClass = cutlass::arch::OpClassSimt; + using SmArch = cutlass::arch::Sm80; + + using AddOp = cuasr::maximum; + using MultOp = cuasr::minimum; + + using Srgemm = cuasr::gemm::device::Srgemm< // + AddOp, MultOp, // + precision, cutlass::layout::RowMajor, // + precision, cutlass::layout::RowMajor, // + precision, cutlass::layout::RowMajor, // + precision, OpClass, SmArch>; + + // setup bench harness + cuasr::bench::device::BenchHarness bench({ N, N, N }); + + // benchmark loop + for (auto _ : state) { + benchmark::DoNotOptimize(bench.run()); + cudaDeviceSynchronize(); + } + + double flops_per_itr = 2.0 * N * N * N; + state.counters["Flop/s"] + = benchmark::Counter(flops_per_itr, benchmark::Counter::kIsIterationInvariantRate); +} +BENCHMARK(BM_SM80_device_maximum_minimum_ssrgemm_tt_t) + ->RangeMultiplier(2)->Range(256, 4096); + +/////////////////////////////////////////////////////////////////////////////// + +static void BM_SM80_device_maximum_minimum_ssrgemm_tn_n(benchmark::State &state) { + const auto N = static_cast(state.range(0)); + using precision = float; + using OpClass = cutlass::arch::OpClassSimt; + using SmArch = cutlass::arch::Sm80; + + using AddOp = cuasr::maximum; + using MultOp = cuasr::minimum; + + using Srgemm = cuasr::gemm::device::Srgemm< // + AddOp, MultOp, // + precision, 
cutlass::layout::RowMajor, // + precision, cutlass::layout::ColumnMajor, // + precision, cutlass::layout::ColumnMajor, // + precision, OpClass, SmArch>; + + // setup bench harness + cuasr::bench::device::BenchHarness bench({ N, N, N }); + + // benchmark loop + for (auto _ : state) { + benchmark::DoNotOptimize(bench.run()); + cudaDeviceSynchronize(); + } + + double flops_per_itr = 2.0 * N * N * N; + state.counters["Flop/s"] + = benchmark::Counter(flops_per_itr, benchmark::Counter::kIsIterationInvariantRate); +} +BENCHMARK(BM_SM80_device_maximum_minimum_ssrgemm_tn_n) + ->RangeMultiplier(2)->Range(256, 4096); + +/////////////////////////////////////////////////////////////////////////////// + +static void BM_SM80_device_maximum_minimum_ssrgemm_tn_t(benchmark::State &state) { + const auto N = static_cast(state.range(0)); + using precision = float; + using OpClass = cutlass::arch::OpClassSimt; + using SmArch = cutlass::arch::Sm80; + + using AddOp = cuasr::maximum; + using MultOp = cuasr::minimum; + + using Srgemm = cuasr::gemm::device::Srgemm< // + AddOp, MultOp, // + precision, cutlass::layout::RowMajor, // + precision, cutlass::layout::ColumnMajor, // + precision, cutlass::layout::RowMajor, // + precision, OpClass, SmArch>; + + // setup bench harness + cuasr::bench::device::BenchHarness bench({ N, N, N }); + + // benchmark loop + for (auto _ : state) { + benchmark::DoNotOptimize(bench.run()); + cudaDeviceSynchronize(); + } + + double flops_per_itr = 2.0 * N * N * N; + state.counters["Flop/s"] + = benchmark::Counter(flops_per_itr, benchmark::Counter::kIsIterationInvariantRate); +} +BENCHMARK(BM_SM80_device_maximum_minimum_ssrgemm_tn_t) + ->RangeMultiplier(2)->Range(256, 4096); + +/////////////////////////////////////////////////////////////////////////////// + +static void BM_SM80_device_maximum_minimum_ssrgemm_nt_n(benchmark::State &state) { + const auto N = static_cast(state.range(0)); + using precision = float; + using OpClass = cutlass::arch::OpClassSimt; + using 
SmArch = cutlass::arch::Sm80; + + using AddOp = cuasr::maximum; + using MultOp = cuasr::minimum; + + using Srgemm = cuasr::gemm::device::Srgemm< // + AddOp, MultOp, // + precision, cutlass::layout::ColumnMajor, // + precision, cutlass::layout::RowMajor, // + precision, cutlass::layout::ColumnMajor, // + precision, OpClass, SmArch>; + + // setup bench harness + cuasr::bench::device::BenchHarness bench({ N, N, N }); + + // benchmark loop + for (auto _ : state) { + benchmark::DoNotOptimize(bench.run()); + cudaDeviceSynchronize(); + } + + double flops_per_itr = 2.0 * N * N * N; + state.counters["Flop/s"] + = benchmark::Counter(flops_per_itr, benchmark::Counter::kIsIterationInvariantRate); +} +BENCHMARK(BM_SM80_device_maximum_minimum_ssrgemm_nt_n) + ->RangeMultiplier(2)->Range(256, 4096); + +/////////////////////////////////////////////////////////////////////////////// + +static void BM_SM80_device_maximum_minimum_ssrgemm_nt_t(benchmark::State &state) { + const auto N = static_cast(state.range(0)); + using precision = float; + using OpClass = cutlass::arch::OpClassSimt; + using SmArch = cutlass::arch::Sm80; + + using AddOp = cuasr::maximum; + using MultOp = cuasr::minimum; + + using Srgemm = cuasr::gemm::device::Srgemm< // + AddOp, MultOp, // + precision, cutlass::layout::ColumnMajor, // + precision, cutlass::layout::RowMajor, // + precision, cutlass::layout::RowMajor, // + precision, OpClass, SmArch>; + + // setup bench harness + cuasr::bench::device::BenchHarness bench({ N, N, N }); + + // benchmark loop + for (auto _ : state) { + benchmark::DoNotOptimize(bench.run()); + cudaDeviceSynchronize(); + } + + double flops_per_itr = 2.0 * N * N * N; + state.counters["Flop/s"] + = benchmark::Counter(flops_per_itr, benchmark::Counter::kIsIterationInvariantRate); +} +BENCHMARK(BM_SM80_device_maximum_minimum_ssrgemm_nt_t) + ->RangeMultiplier(2)->Range(256, 4096); + +/////////////////////////////////////////////////////////////////////////////// + +static void 
BM_SM80_device_maximum_minimum_ssrgemm_nn_n(benchmark::State &state) { + const auto N = static_cast(state.range(0)); + using precision = float; + using OpClass = cutlass::arch::OpClassSimt; + using SmArch = cutlass::arch::Sm80; + + using AddOp = cuasr::maximum; + using MultOp = cuasr::minimum; + + using Srgemm = cuasr::gemm::device::Srgemm< // + AddOp, MultOp, // + precision, cutlass::layout::ColumnMajor, // + precision, cutlass::layout::ColumnMajor, // + precision, cutlass::layout::ColumnMajor, // + precision, OpClass, SmArch>; + + // setup bench harness + cuasr::bench::device::BenchHarness bench({ N, N, N }); + + // benchmark loop + for (auto _ : state) { + benchmark::DoNotOptimize(bench.run()); + cudaDeviceSynchronize(); + } + + double flops_per_itr = 2.0 * N * N * N; + state.counters["Flop/s"] + = benchmark::Counter(flops_per_itr, benchmark::Counter::kIsIterationInvariantRate); +} +BENCHMARK(BM_SM80_device_maximum_minimum_ssrgemm_nn_n) + ->RangeMultiplier(2)->Range(256, 4096); + +/////////////////////////////////////////////////////////////////////////////// + +static void BM_SM80_device_maximum_minimum_ssrgemm_nn_t(benchmark::State &state) { + const auto N = static_cast(state.range(0)); + using precision = float; + using OpClass = cutlass::arch::OpClassSimt; + using SmArch = cutlass::arch::Sm80; + + using AddOp = cuasr::maximum; + using MultOp = cuasr::minimum; + + using Srgemm = cuasr::gemm::device::Srgemm< // + AddOp, MultOp, // + precision, cutlass::layout::ColumnMajor, // + precision, cutlass::layout::ColumnMajor, // + precision, cutlass::layout::RowMajor, // + precision, OpClass, SmArch>; + + // setup bench harness + cuasr::bench::device::BenchHarness bench({ N, N, N }); + + // benchmark loop + for (auto _ : state) { + benchmark::DoNotOptimize(bench.run()); + cudaDeviceSynchronize(); + } + + double flops_per_itr = 2.0 * N * N * N; + state.counters["Flop/s"] + = benchmark::Counter(flops_per_itr, benchmark::Counter::kIsIterationInvariantRate); +} 
+BENCHMARK(BM_SM80_device_maximum_minimum_ssrgemm_nn_t) + ->RangeMultiplier(2)->Range(256, 4096); + +/////////////////////////////////////////////////////////////////////////////// + +static void BM_SM80_device_minimum_multiplies_dsrgemm_tt_n(benchmark::State &state) { + const auto N = static_cast(state.range(0)); + using precision = double; + using OpClass = cutlass::arch::OpClassSimt; + using SmArch = cutlass::arch::Sm80; + + using AddOp = cuasr::minimum; + using MultOp = cuasr::multiplies; + + using Srgemm = cuasr::gemm::device::Srgemm< // + AddOp, MultOp, // + precision, cutlass::layout::RowMajor, // + precision, cutlass::layout::RowMajor, // + precision, cutlass::layout::ColumnMajor, // + precision, OpClass, SmArch>; + + // setup bench harness + cuasr::bench::device::BenchHarness bench({ N, N, N }); + + // benchmark loop + for (auto _ : state) { + benchmark::DoNotOptimize(bench.run()); + cudaDeviceSynchronize(); + } + + double flops_per_itr = 2.0 * N * N * N; + state.counters["Flop/s"] + = benchmark::Counter(flops_per_itr, benchmark::Counter::kIsIterationInvariantRate); +} +BENCHMARK(BM_SM80_device_minimum_multiplies_dsrgemm_tt_n) + ->RangeMultiplier(2)->Range(256, 4096); + +/////////////////////////////////////////////////////////////////////////////// + +static void BM_SM80_device_minimum_multiplies_dsrgemm_tt_t(benchmark::State &state) { + const auto N = static_cast(state.range(0)); + using precision = double; + using OpClass = cutlass::arch::OpClassSimt; + using SmArch = cutlass::arch::Sm80; + + using AddOp = cuasr::minimum; + using MultOp = cuasr::multiplies; + + using Srgemm = cuasr::gemm::device::Srgemm< // + AddOp, MultOp, // + precision, cutlass::layout::RowMajor, // + precision, cutlass::layout::RowMajor, // + precision, cutlass::layout::RowMajor, // + precision, OpClass, SmArch>; + + // setup bench harness + cuasr::bench::device::BenchHarness bench({ N, N, N }); + + // benchmark loop + for (auto _ : state) { + benchmark::DoNotOptimize(bench.run()); 
+ cudaDeviceSynchronize(); + } + + double flops_per_itr = 2.0 * N * N * N; + state.counters["Flop/s"] + = benchmark::Counter(flops_per_itr, benchmark::Counter::kIsIterationInvariantRate); +} +BENCHMARK(BM_SM80_device_minimum_multiplies_dsrgemm_tt_t) + ->RangeMultiplier(2)->Range(256, 4096); + +/////////////////////////////////////////////////////////////////////////////// + +static void BM_SM80_device_minimum_multiplies_dsrgemm_tn_n(benchmark::State &state) { + const auto N = static_cast(state.range(0)); + using precision = double; + using OpClass = cutlass::arch::OpClassSimt; + using SmArch = cutlass::arch::Sm80; + + using AddOp = cuasr::minimum; + using MultOp = cuasr::multiplies; + + using Srgemm = cuasr::gemm::device::Srgemm< // + AddOp, MultOp, // + precision, cutlass::layout::RowMajor, // + precision, cutlass::layout::ColumnMajor, // + precision, cutlass::layout::ColumnMajor, // + precision, OpClass, SmArch>; + + // setup bench harness + cuasr::bench::device::BenchHarness bench({ N, N, N }); + + // benchmark loop + for (auto _ : state) { + benchmark::DoNotOptimize(bench.run()); + cudaDeviceSynchronize(); + } + + double flops_per_itr = 2.0 * N * N * N; + state.counters["Flop/s"] + = benchmark::Counter(flops_per_itr, benchmark::Counter::kIsIterationInvariantRate); +} +BENCHMARK(BM_SM80_device_minimum_multiplies_dsrgemm_tn_n) + ->RangeMultiplier(2)->Range(256, 4096); + +/////////////////////////////////////////////////////////////////////////////// + +static void BM_SM80_device_minimum_multiplies_dsrgemm_tn_t(benchmark::State &state) { + const auto N = static_cast(state.range(0)); + using precision = double; + using OpClass = cutlass::arch::OpClassSimt; + using SmArch = cutlass::arch::Sm80; + + using AddOp = cuasr::minimum; + using MultOp = cuasr::multiplies; + + using Srgemm = cuasr::gemm::device::Srgemm< // + AddOp, MultOp, // + precision, cutlass::layout::RowMajor, // + precision, cutlass::layout::ColumnMajor, // + precision, cutlass::layout::RowMajor, // + 
precision, OpClass, SmArch>; + + // setup bench harness + cuasr::bench::device::BenchHarness bench({ N, N, N }); + + // benchmark loop + for (auto _ : state) { + benchmark::DoNotOptimize(bench.run()); + cudaDeviceSynchronize(); + } + + double flops_per_itr = 2.0 * N * N * N; + state.counters["Flop/s"] + = benchmark::Counter(flops_per_itr, benchmark::Counter::kIsIterationInvariantRate); +} +BENCHMARK(BM_SM80_device_minimum_multiplies_dsrgemm_tn_t) + ->RangeMultiplier(2)->Range(256, 4096); + +/////////////////////////////////////////////////////////////////////////////// + +static void BM_SM80_device_minimum_multiplies_dsrgemm_nt_n(benchmark::State &state) { + const auto N = static_cast(state.range(0)); + using precision = double; + using OpClass = cutlass::arch::OpClassSimt; + using SmArch = cutlass::arch::Sm80; + + using AddOp = cuasr::minimum; + using MultOp = cuasr::multiplies; + + using Srgemm = cuasr::gemm::device::Srgemm< // + AddOp, MultOp, // + precision, cutlass::layout::ColumnMajor, // + precision, cutlass::layout::RowMajor, // + precision, cutlass::layout::ColumnMajor, // + precision, OpClass, SmArch>; + + // setup bench harness + cuasr::bench::device::BenchHarness bench({ N, N, N }); + + // benchmark loop + for (auto _ : state) { + benchmark::DoNotOptimize(bench.run()); + cudaDeviceSynchronize(); + } + + double flops_per_itr = 2.0 * N * N * N; + state.counters["Flop/s"] + = benchmark::Counter(flops_per_itr, benchmark::Counter::kIsIterationInvariantRate); +} +BENCHMARK(BM_SM80_device_minimum_multiplies_dsrgemm_nt_n) + ->RangeMultiplier(2)->Range(256, 4096); + +/////////////////////////////////////////////////////////////////////////////// + +static void BM_SM80_device_minimum_multiplies_dsrgemm_nt_t(benchmark::State &state) { + const auto N = static_cast(state.range(0)); + using precision = double; + using OpClass = cutlass::arch::OpClassSimt; + using SmArch = cutlass::arch::Sm80; + + using AddOp = cuasr::minimum; + using MultOp = cuasr::multiplies; + + 
using Srgemm = cuasr::gemm::device::Srgemm< // + AddOp, MultOp, // + precision, cutlass::layout::ColumnMajor, // + precision, cutlass::layout::RowMajor, // + precision, cutlass::layout::RowMajor, // + precision, OpClass, SmArch>; + + // setup bench harness + cuasr::bench::device::BenchHarness bench({ N, N, N }); + + // benchmark loop + for (auto _ : state) { + benchmark::DoNotOptimize(bench.run()); + cudaDeviceSynchronize(); + } + + double flops_per_itr = 2.0 * N * N * N; + state.counters["Flop/s"] + = benchmark::Counter(flops_per_itr, benchmark::Counter::kIsIterationInvariantRate); +} +BENCHMARK(BM_SM80_device_minimum_multiplies_dsrgemm_nt_t) + ->RangeMultiplier(2)->Range(256, 4096); + +/////////////////////////////////////////////////////////////////////////////// + +static void BM_SM80_device_minimum_multiplies_dsrgemm_nn_n(benchmark::State &state) { + const auto N = static_cast(state.range(0)); + using precision = double; + using OpClass = cutlass::arch::OpClassSimt; + using SmArch = cutlass::arch::Sm80; + + using AddOp = cuasr::minimum; + using MultOp = cuasr::multiplies; + + using Srgemm = cuasr::gemm::device::Srgemm< // + AddOp, MultOp, // + precision, cutlass::layout::ColumnMajor, // + precision, cutlass::layout::ColumnMajor, // + precision, cutlass::layout::ColumnMajor, // + precision, OpClass, SmArch>; + + // setup bench harness + cuasr::bench::device::BenchHarness bench({ N, N, N }); + + // benchmark loop + for (auto _ : state) { + benchmark::DoNotOptimize(bench.run()); + cudaDeviceSynchronize(); + } + + double flops_per_itr = 2.0 * N * N * N; + state.counters["Flop/s"] + = benchmark::Counter(flops_per_itr, benchmark::Counter::kIsIterationInvariantRate); +} +BENCHMARK(BM_SM80_device_minimum_multiplies_dsrgemm_nn_n) + ->RangeMultiplier(2)->Range(256, 4096); + +/////////////////////////////////////////////////////////////////////////////// + +static void BM_SM80_device_minimum_multiplies_dsrgemm_nn_t(benchmark::State &state) { + const auto N = 
static_cast(state.range(0)); + using precision = double; + using OpClass = cutlass::arch::OpClassSimt; + using SmArch = cutlass::arch::Sm80; + + using AddOp = cuasr::minimum; + using MultOp = cuasr::multiplies; + + using Srgemm = cuasr::gemm::device::Srgemm< // + AddOp, MultOp, // + precision, cutlass::layout::ColumnMajor, // + precision, cutlass::layout::ColumnMajor, // + precision, cutlass::layout::RowMajor, // + precision, OpClass, SmArch>; + + // setup bench harness + cuasr::bench::device::BenchHarness bench({ N, N, N }); + + // benchmark loop + for (auto _ : state) { + benchmark::DoNotOptimize(bench.run()); + cudaDeviceSynchronize(); + } + + double flops_per_itr = 2.0 * N * N * N; + state.counters["Flop/s"] + = benchmark::Counter(flops_per_itr, benchmark::Counter::kIsIterationInvariantRate); +} +BENCHMARK(BM_SM80_device_minimum_multiplies_dsrgemm_nn_t) + ->RangeMultiplier(2)->Range(256, 4096); + +/////////////////////////////////////////////////////////////////////////////// + +static void BM_SM80_device_minimum_multiplies_ssrgemm_tt_n(benchmark::State &state) { + const auto N = static_cast(state.range(0)); + using precision = float; + using OpClass = cutlass::arch::OpClassSimt; + using SmArch = cutlass::arch::Sm80; + + using AddOp = cuasr::minimum; + using MultOp = cuasr::multiplies; + + using Srgemm = cuasr::gemm::device::Srgemm< // + AddOp, MultOp, // + precision, cutlass::layout::RowMajor, // + precision, cutlass::layout::RowMajor, // + precision, cutlass::layout::ColumnMajor, // + precision, OpClass, SmArch>; + + // setup bench harness + cuasr::bench::device::BenchHarness bench({ N, N, N }); + + // benchmark loop + for (auto _ : state) { + benchmark::DoNotOptimize(bench.run()); + cudaDeviceSynchronize(); + } + + double flops_per_itr = 2.0 * N * N * N; + state.counters["Flop/s"] + = benchmark::Counter(flops_per_itr, benchmark::Counter::kIsIterationInvariantRate); +} +BENCHMARK(BM_SM80_device_minimum_multiplies_ssrgemm_tt_n) + 
->RangeMultiplier(2)->Range(256, 4096); + +/////////////////////////////////////////////////////////////////////////////// + +static void BM_SM80_device_minimum_multiplies_ssrgemm_tt_t(benchmark::State &state) { + const auto N = static_cast(state.range(0)); + using precision = float; + using OpClass = cutlass::arch::OpClassSimt; + using SmArch = cutlass::arch::Sm80; + + using AddOp = cuasr::minimum; + using MultOp = cuasr::multiplies; + + using Srgemm = cuasr::gemm::device::Srgemm< // + AddOp, MultOp, // + precision, cutlass::layout::RowMajor, // + precision, cutlass::layout::RowMajor, // + precision, cutlass::layout::RowMajor, // + precision, OpClass, SmArch>; + + // setup bench harness + cuasr::bench::device::BenchHarness bench({ N, N, N }); + + // benchmark loop + for (auto _ : state) { + benchmark::DoNotOptimize(bench.run()); + cudaDeviceSynchronize(); + } + + double flops_per_itr = 2.0 * N * N * N; + state.counters["Flop/s"] + = benchmark::Counter(flops_per_itr, benchmark::Counter::kIsIterationInvariantRate); +} +BENCHMARK(BM_SM80_device_minimum_multiplies_ssrgemm_tt_t) + ->RangeMultiplier(2)->Range(256, 4096); + +/////////////////////////////////////////////////////////////////////////////// + +static void BM_SM80_device_minimum_multiplies_ssrgemm_tn_n(benchmark::State &state) { + const auto N = static_cast(state.range(0)); + using precision = float; + using OpClass = cutlass::arch::OpClassSimt; + using SmArch = cutlass::arch::Sm80; + + using AddOp = cuasr::minimum; + using MultOp = cuasr::multiplies; + + using Srgemm = cuasr::gemm::device::Srgemm< // + AddOp, MultOp, // + precision, cutlass::layout::RowMajor, // + precision, cutlass::layout::ColumnMajor, // + precision, cutlass::layout::ColumnMajor, // + precision, OpClass, SmArch>; + + // setup bench harness + cuasr::bench::device::BenchHarness bench({ N, N, N }); + + // benchmark loop + for (auto _ : state) { + benchmark::DoNotOptimize(bench.run()); + cudaDeviceSynchronize(); + } + + double flops_per_itr = 
2.0 * N * N * N; + state.counters["Flop/s"] + = benchmark::Counter(flops_per_itr, benchmark::Counter::kIsIterationInvariantRate); +} +BENCHMARK(BM_SM80_device_minimum_multiplies_ssrgemm_tn_n) + ->RangeMultiplier(2)->Range(256, 4096); + +/////////////////////////////////////////////////////////////////////////////// + +static void BM_SM80_device_minimum_multiplies_ssrgemm_tn_t(benchmark::State &state) { + const auto N = static_cast(state.range(0)); + using precision = float; + using OpClass = cutlass::arch::OpClassSimt; + using SmArch = cutlass::arch::Sm80; + + using AddOp = cuasr::minimum; + using MultOp = cuasr::multiplies; + + using Srgemm = cuasr::gemm::device::Srgemm< // + AddOp, MultOp, // + precision, cutlass::layout::RowMajor, // + precision, cutlass::layout::ColumnMajor, // + precision, cutlass::layout::RowMajor, // + precision, OpClass, SmArch>; + + // setup bench harness + cuasr::bench::device::BenchHarness bench({ N, N, N }); + + // benchmark loop + for (auto _ : state) { + benchmark::DoNotOptimize(bench.run()); + cudaDeviceSynchronize(); + } + + double flops_per_itr = 2.0 * N * N * N; + state.counters["Flop/s"] + = benchmark::Counter(flops_per_itr, benchmark::Counter::kIsIterationInvariantRate); +} +BENCHMARK(BM_SM80_device_minimum_multiplies_ssrgemm_tn_t) + ->RangeMultiplier(2)->Range(256, 4096); + +/////////////////////////////////////////////////////////////////////////////// + +static void BM_SM80_device_minimum_multiplies_ssrgemm_nt_n(benchmark::State &state) { + const auto N = static_cast(state.range(0)); + using precision = float; + using OpClass = cutlass::arch::OpClassSimt; + using SmArch = cutlass::arch::Sm80; + + using AddOp = cuasr::minimum; + using MultOp = cuasr::multiplies; + + using Srgemm = cuasr::gemm::device::Srgemm< // + AddOp, MultOp, // + precision, cutlass::layout::ColumnMajor, // + precision, cutlass::layout::RowMajor, // + precision, cutlass::layout::ColumnMajor, // + precision, OpClass, SmArch>; + + // setup bench harness + 
cuasr::bench::device::BenchHarness bench({ N, N, N }); + + // benchmark loop + for (auto _ : state) { + benchmark::DoNotOptimize(bench.run()); + cudaDeviceSynchronize(); + } + + double flops_per_itr = 2.0 * N * N * N; + state.counters["Flop/s"] + = benchmark::Counter(flops_per_itr, benchmark::Counter::kIsIterationInvariantRate); +} +BENCHMARK(BM_SM80_device_minimum_multiplies_ssrgemm_nt_n) + ->RangeMultiplier(2)->Range(256, 4096); + +/////////////////////////////////////////////////////////////////////////////// + +static void BM_SM80_device_minimum_multiplies_ssrgemm_nt_t(benchmark::State &state) { + const auto N = static_cast(state.range(0)); + using precision = float; + using OpClass = cutlass::arch::OpClassSimt; + using SmArch = cutlass::arch::Sm80; + + using AddOp = cuasr::minimum; + using MultOp = cuasr::multiplies; + + using Srgemm = cuasr::gemm::device::Srgemm< // + AddOp, MultOp, // + precision, cutlass::layout::ColumnMajor, // + precision, cutlass::layout::RowMajor, // + precision, cutlass::layout::RowMajor, // + precision, OpClass, SmArch>; + + // setup bench harness + cuasr::bench::device::BenchHarness bench({ N, N, N }); + + // benchmark loop + for (auto _ : state) { + benchmark::DoNotOptimize(bench.run()); + cudaDeviceSynchronize(); + } + + double flops_per_itr = 2.0 * N * N * N; + state.counters["Flop/s"] + = benchmark::Counter(flops_per_itr, benchmark::Counter::kIsIterationInvariantRate); +} +BENCHMARK(BM_SM80_device_minimum_multiplies_ssrgemm_nt_t) + ->RangeMultiplier(2)->Range(256, 4096); + +/////////////////////////////////////////////////////////////////////////////// + +static void BM_SM80_device_minimum_multiplies_ssrgemm_nn_n(benchmark::State &state) { + const auto N = static_cast(state.range(0)); + using precision = float; + using OpClass = cutlass::arch::OpClassSimt; + using SmArch = cutlass::arch::Sm80; + + using AddOp = cuasr::minimum; + using MultOp = cuasr::multiplies; + + using Srgemm = cuasr::gemm::device::Srgemm< // + AddOp, MultOp, 
// + precision, cutlass::layout::ColumnMajor, // + precision, cutlass::layout::ColumnMajor, // + precision, cutlass::layout::ColumnMajor, // + precision, OpClass, SmArch>; + + // setup bench harness + cuasr::bench::device::BenchHarness bench({ N, N, N }); + + // benchmark loop + for (auto _ : state) { + benchmark::DoNotOptimize(bench.run()); + cudaDeviceSynchronize(); + } + + double flops_per_itr = 2.0 * N * N * N; + state.counters["Flop/s"] + = benchmark::Counter(flops_per_itr, benchmark::Counter::kIsIterationInvariantRate); +} +BENCHMARK(BM_SM80_device_minimum_multiplies_ssrgemm_nn_n) + ->RangeMultiplier(2)->Range(256, 4096); + +/////////////////////////////////////////////////////////////////////////////// + +static void BM_SM80_device_minimum_multiplies_ssrgemm_nn_t(benchmark::State &state) { + const auto N = static_cast(state.range(0)); + using precision = float; + using OpClass = cutlass::arch::OpClassSimt; + using SmArch = cutlass::arch::Sm80; + + using AddOp = cuasr::minimum; + using MultOp = cuasr::multiplies; + + using Srgemm = cuasr::gemm::device::Srgemm< // + AddOp, MultOp, // + precision, cutlass::layout::ColumnMajor, // + precision, cutlass::layout::ColumnMajor, // + precision, cutlass::layout::RowMajor, // + precision, OpClass, SmArch>; + + // setup bench harness + cuasr::bench::device::BenchHarness bench({ N, N, N }); + + // benchmark loop + for (auto _ : state) { + benchmark::DoNotOptimize(bench.run()); + cudaDeviceSynchronize(); + } + + double flops_per_itr = 2.0 * N * N * N; + state.counters["Flop/s"] + = benchmark::Counter(flops_per_itr, benchmark::Counter::kIsIterationInvariantRate); +} +BENCHMARK(BM_SM80_device_minimum_multiplies_ssrgemm_nn_t) + ->RangeMultiplier(2)->Range(256, 4096); + +/////////////////////////////////////////////////////////////////////////////// + +static void BM_SM80_device_maximum_multiplies_dsrgemm_tt_n(benchmark::State &state) { + const auto N = static_cast(state.range(0)); + using precision = double; + using OpClass = 
cutlass::arch::OpClassSimt; + using SmArch = cutlass::arch::Sm80; + + using AddOp = cuasr::maximum; + using MultOp = cuasr::multiplies; + + using Srgemm = cuasr::gemm::device::Srgemm< // + AddOp, MultOp, // + precision, cutlass::layout::RowMajor, // + precision, cutlass::layout::RowMajor, // + precision, cutlass::layout::ColumnMajor, // + precision, OpClass, SmArch>; + + // setup bench harness + cuasr::bench::device::BenchHarness bench({ N, N, N }); + + // benchmark loop + for (auto _ : state) { + benchmark::DoNotOptimize(bench.run()); + cudaDeviceSynchronize(); + } + + double flops_per_itr = 2.0 * N * N * N; + state.counters["Flop/s"] + = benchmark::Counter(flops_per_itr, benchmark::Counter::kIsIterationInvariantRate); +} +BENCHMARK(BM_SM80_device_maximum_multiplies_dsrgemm_tt_n) + ->RangeMultiplier(2)->Range(256, 4096); + +/////////////////////////////////////////////////////////////////////////////// + +static void BM_SM80_device_maximum_multiplies_dsrgemm_tt_t(benchmark::State &state) { + const auto N = static_cast(state.range(0)); + using precision = double; + using OpClass = cutlass::arch::OpClassSimt; + using SmArch = cutlass::arch::Sm80; + + using AddOp = cuasr::maximum; + using MultOp = cuasr::multiplies; + + using Srgemm = cuasr::gemm::device::Srgemm< // + AddOp, MultOp, // + precision, cutlass::layout::RowMajor, // + precision, cutlass::layout::RowMajor, // + precision, cutlass::layout::RowMajor, // + precision, OpClass, SmArch>; + + // setup bench harness + cuasr::bench::device::BenchHarness bench({ N, N, N }); + + // benchmark loop + for (auto _ : state) { + benchmark::DoNotOptimize(bench.run()); + cudaDeviceSynchronize(); + } + + double flops_per_itr = 2.0 * N * N * N; + state.counters["Flop/s"] + = benchmark::Counter(flops_per_itr, benchmark::Counter::kIsIterationInvariantRate); +} +BENCHMARK(BM_SM80_device_maximum_multiplies_dsrgemm_tt_t) + ->RangeMultiplier(2)->Range(256, 4096); + 
+/////////////////////////////////////////////////////////////////////////////// + +static void BM_SM80_device_maximum_multiplies_dsrgemm_tn_n(benchmark::State &state) { + const auto N = static_cast(state.range(0)); + using precision = double; + using OpClass = cutlass::arch::OpClassSimt; + using SmArch = cutlass::arch::Sm80; + + using AddOp = cuasr::maximum; + using MultOp = cuasr::multiplies; + + using Srgemm = cuasr::gemm::device::Srgemm< // + AddOp, MultOp, // + precision, cutlass::layout::RowMajor, // + precision, cutlass::layout::ColumnMajor, // + precision, cutlass::layout::ColumnMajor, // + precision, OpClass, SmArch>; + + // setup bench harness + cuasr::bench::device::BenchHarness bench({ N, N, N }); + + // benchmark loop + for (auto _ : state) { + benchmark::DoNotOptimize(bench.run()); + cudaDeviceSynchronize(); + } + + double flops_per_itr = 2.0 * N * N * N; + state.counters["Flop/s"] + = benchmark::Counter(flops_per_itr, benchmark::Counter::kIsIterationInvariantRate); +} +BENCHMARK(BM_SM80_device_maximum_multiplies_dsrgemm_tn_n) + ->RangeMultiplier(2)->Range(256, 4096); + +/////////////////////////////////////////////////////////////////////////////// + +static void BM_SM80_device_maximum_multiplies_dsrgemm_tn_t(benchmark::State &state) { + const auto N = static_cast(state.range(0)); + using precision = double; + using OpClass = cutlass::arch::OpClassSimt; + using SmArch = cutlass::arch::Sm80; + + using AddOp = cuasr::maximum; + using MultOp = cuasr::multiplies; + + using Srgemm = cuasr::gemm::device::Srgemm< // + AddOp, MultOp, // + precision, cutlass::layout::RowMajor, // + precision, cutlass::layout::ColumnMajor, // + precision, cutlass::layout::RowMajor, // + precision, OpClass, SmArch>; + + // setup bench harness + cuasr::bench::device::BenchHarness bench({ N, N, N }); + + // benchmark loop + for (auto _ : state) { + benchmark::DoNotOptimize(bench.run()); + cudaDeviceSynchronize(); + } + + double flops_per_itr = 2.0 * N * N * N; + 
state.counters["Flop/s"] + = benchmark::Counter(flops_per_itr, benchmark::Counter::kIsIterationInvariantRate); +} +BENCHMARK(BM_SM80_device_maximum_multiplies_dsrgemm_tn_t) + ->RangeMultiplier(2)->Range(256, 4096); + +/////////////////////////////////////////////////////////////////////////////// + +static void BM_SM80_device_maximum_multiplies_dsrgemm_nt_n(benchmark::State &state) { + const auto N = static_cast(state.range(0)); + using precision = double; + using OpClass = cutlass::arch::OpClassSimt; + using SmArch = cutlass::arch::Sm80; + + using AddOp = cuasr::maximum; + using MultOp = cuasr::multiplies; + + using Srgemm = cuasr::gemm::device::Srgemm< // + AddOp, MultOp, // + precision, cutlass::layout::ColumnMajor, // + precision, cutlass::layout::RowMajor, // + precision, cutlass::layout::ColumnMajor, // + precision, OpClass, SmArch>; + + // setup bench harness + cuasr::bench::device::BenchHarness bench({ N, N, N }); + + // benchmark loop + for (auto _ : state) { + benchmark::DoNotOptimize(bench.run()); + cudaDeviceSynchronize(); + } + + double flops_per_itr = 2.0 * N * N * N; + state.counters["Flop/s"] + = benchmark::Counter(flops_per_itr, benchmark::Counter::kIsIterationInvariantRate); +} +BENCHMARK(BM_SM80_device_maximum_multiplies_dsrgemm_nt_n) + ->RangeMultiplier(2)->Range(256, 4096); + +/////////////////////////////////////////////////////////////////////////////// + +static void BM_SM80_device_maximum_multiplies_dsrgemm_nt_t(benchmark::State &state) { + const auto N = static_cast(state.range(0)); + using precision = double; + using OpClass = cutlass::arch::OpClassSimt; + using SmArch = cutlass::arch::Sm80; + + using AddOp = cuasr::maximum; + using MultOp = cuasr::multiplies; + + using Srgemm = cuasr::gemm::device::Srgemm< // + AddOp, MultOp, // + precision, cutlass::layout::ColumnMajor, // + precision, cutlass::layout::RowMajor, // + precision, cutlass::layout::RowMajor, // + precision, OpClass, SmArch>; + + // setup bench harness + 
cuasr::bench::device::BenchHarness bench({ N, N, N }); + + // benchmark loop + for (auto _ : state) { + benchmark::DoNotOptimize(bench.run()); + cudaDeviceSynchronize(); + } + + double flops_per_itr = 2.0 * N * N * N; + state.counters["Flop/s"] + = benchmark::Counter(flops_per_itr, benchmark::Counter::kIsIterationInvariantRate); +} +BENCHMARK(BM_SM80_device_maximum_multiplies_dsrgemm_nt_t) + ->RangeMultiplier(2)->Range(256, 4096); + +/////////////////////////////////////////////////////////////////////////////// + +static void BM_SM80_device_maximum_multiplies_dsrgemm_nn_n(benchmark::State &state) { + const auto N = static_cast(state.range(0)); + using precision = double; + using OpClass = cutlass::arch::OpClassSimt; + using SmArch = cutlass::arch::Sm80; + + using AddOp = cuasr::maximum; + using MultOp = cuasr::multiplies; + + using Srgemm = cuasr::gemm::device::Srgemm< // + AddOp, MultOp, // + precision, cutlass::layout::ColumnMajor, // + precision, cutlass::layout::ColumnMajor, // + precision, cutlass::layout::ColumnMajor, // + precision, OpClass, SmArch>; + + // setup bench harness + cuasr::bench::device::BenchHarness bench({ N, N, N }); + + // benchmark loop + for (auto _ : state) { + benchmark::DoNotOptimize(bench.run()); + cudaDeviceSynchronize(); + } + + double flops_per_itr = 2.0 * N * N * N; + state.counters["Flop/s"] + = benchmark::Counter(flops_per_itr, benchmark::Counter::kIsIterationInvariantRate); +} +BENCHMARK(BM_SM80_device_maximum_multiplies_dsrgemm_nn_n) + ->RangeMultiplier(2)->Range(256, 4096); + +/////////////////////////////////////////////////////////////////////////////// + +static void BM_SM80_device_maximum_multiplies_dsrgemm_nn_t(benchmark::State &state) { + const auto N = static_cast(state.range(0)); + using precision = double; + using OpClass = cutlass::arch::OpClassSimt; + using SmArch = cutlass::arch::Sm80; + + using AddOp = cuasr::maximum; + using MultOp = cuasr::multiplies; + + using Srgemm = cuasr::gemm::device::Srgemm< // + AddOp, 
MultOp, // + precision, cutlass::layout::ColumnMajor, // + precision, cutlass::layout::ColumnMajor, // + precision, cutlass::layout::RowMajor, // + precision, OpClass, SmArch>; + + // setup bench harness + cuasr::bench::device::BenchHarness bench({ N, N, N }); + + // benchmark loop + for (auto _ : state) { + benchmark::DoNotOptimize(bench.run()); + cudaDeviceSynchronize(); + } + + double flops_per_itr = 2.0 * N * N * N; + state.counters["Flop/s"] + = benchmark::Counter(flops_per_itr, benchmark::Counter::kIsIterationInvariantRate); +} +BENCHMARK(BM_SM80_device_maximum_multiplies_dsrgemm_nn_t) + ->RangeMultiplier(2)->Range(256, 4096); + +/////////////////////////////////////////////////////////////////////////////// + +static void BM_SM80_device_maximum_multiplies_ssrgemm_tt_n(benchmark::State &state) { + const auto N = static_cast(state.range(0)); + using precision = float; + using OpClass = cutlass::arch::OpClassSimt; + using SmArch = cutlass::arch::Sm80; + + using AddOp = cuasr::maximum; + using MultOp = cuasr::multiplies; + + using Srgemm = cuasr::gemm::device::Srgemm< // + AddOp, MultOp, // + precision, cutlass::layout::RowMajor, // + precision, cutlass::layout::RowMajor, // + precision, cutlass::layout::ColumnMajor, // + precision, OpClass, SmArch>; + + // setup bench harness + cuasr::bench::device::BenchHarness bench({ N, N, N }); + + // benchmark loop + for (auto _ : state) { + benchmark::DoNotOptimize(bench.run()); + cudaDeviceSynchronize(); + } + + double flops_per_itr = 2.0 * N * N * N; + state.counters["Flop/s"] + = benchmark::Counter(flops_per_itr, benchmark::Counter::kIsIterationInvariantRate); +} +BENCHMARK(BM_SM80_device_maximum_multiplies_ssrgemm_tt_n) + ->RangeMultiplier(2)->Range(256, 4096); + +/////////////////////////////////////////////////////////////////////////////// + +static void BM_SM80_device_maximum_multiplies_ssrgemm_tt_t(benchmark::State &state) { + const auto N = static_cast(state.range(0)); + using precision = float; + using OpClass 
= cutlass::arch::OpClassSimt; + using SmArch = cutlass::arch::Sm80; + + using AddOp = cuasr::maximum; + using MultOp = cuasr::multiplies; + + using Srgemm = cuasr::gemm::device::Srgemm< // + AddOp, MultOp, // + precision, cutlass::layout::RowMajor, // + precision, cutlass::layout::RowMajor, // + precision, cutlass::layout::RowMajor, // + precision, OpClass, SmArch>; + + // setup bench harness + cuasr::bench::device::BenchHarness bench({ N, N, N }); + + // benchmark loop + for (auto _ : state) { + benchmark::DoNotOptimize(bench.run()); + cudaDeviceSynchronize(); + } + + double flops_per_itr = 2.0 * N * N * N; + state.counters["Flop/s"] + = benchmark::Counter(flops_per_itr, benchmark::Counter::kIsIterationInvariantRate); +} +BENCHMARK(BM_SM80_device_maximum_multiplies_ssrgemm_tt_t) + ->RangeMultiplier(2)->Range(256, 4096); + +/////////////////////////////////////////////////////////////////////////////// + +static void BM_SM80_device_maximum_multiplies_ssrgemm_tn_n(benchmark::State &state) { + const auto N = static_cast(state.range(0)); + using precision = float; + using OpClass = cutlass::arch::OpClassSimt; + using SmArch = cutlass::arch::Sm80; + + using AddOp = cuasr::maximum; + using MultOp = cuasr::multiplies; + + using Srgemm = cuasr::gemm::device::Srgemm< // + AddOp, MultOp, // + precision, cutlass::layout::RowMajor, // + precision, cutlass::layout::ColumnMajor, // + precision, cutlass::layout::ColumnMajor, // + precision, OpClass, SmArch>; + + // setup bench harness + cuasr::bench::device::BenchHarness bench({ N, N, N }); + + // benchmark loop + for (auto _ : state) { + benchmark::DoNotOptimize(bench.run()); + cudaDeviceSynchronize(); + } + + double flops_per_itr = 2.0 * N * N * N; + state.counters["Flop/s"] + = benchmark::Counter(flops_per_itr, benchmark::Counter::kIsIterationInvariantRate); +} +BENCHMARK(BM_SM80_device_maximum_multiplies_ssrgemm_tn_n) + ->RangeMultiplier(2)->Range(256, 4096); + 
+/////////////////////////////////////////////////////////////////////////////// + +static void BM_SM80_device_maximum_multiplies_ssrgemm_tn_t(benchmark::State &state) { + const auto N = static_cast(state.range(0)); + using precision = float; + using OpClass = cutlass::arch::OpClassSimt; + using SmArch = cutlass::arch::Sm80; + + using AddOp = cuasr::maximum; + using MultOp = cuasr::multiplies; + + using Srgemm = cuasr::gemm::device::Srgemm< // + AddOp, MultOp, // + precision, cutlass::layout::RowMajor, // + precision, cutlass::layout::ColumnMajor, // + precision, cutlass::layout::RowMajor, // + precision, OpClass, SmArch>; + + // setup bench harness + cuasr::bench::device::BenchHarness bench({ N, N, N }); + + // benchmark loop + for (auto _ : state) { + benchmark::DoNotOptimize(bench.run()); + cudaDeviceSynchronize(); + } + + double flops_per_itr = 2.0 * N * N * N; + state.counters["Flop/s"] + = benchmark::Counter(flops_per_itr, benchmark::Counter::kIsIterationInvariantRate); +} +BENCHMARK(BM_SM80_device_maximum_multiplies_ssrgemm_tn_t) + ->RangeMultiplier(2)->Range(256, 4096); + +/////////////////////////////////////////////////////////////////////////////// + +static void BM_SM80_device_maximum_multiplies_ssrgemm_nt_n(benchmark::State &state) { + const auto N = static_cast(state.range(0)); + using precision = float; + using OpClass = cutlass::arch::OpClassSimt; + using SmArch = cutlass::arch::Sm80; + + using AddOp = cuasr::maximum; + using MultOp = cuasr::multiplies; + + using Srgemm = cuasr::gemm::device::Srgemm< // + AddOp, MultOp, // + precision, cutlass::layout::ColumnMajor, // + precision, cutlass::layout::RowMajor, // + precision, cutlass::layout::ColumnMajor, // + precision, OpClass, SmArch>; + + // setup bench harness + cuasr::bench::device::BenchHarness bench({ N, N, N }); + + // benchmark loop + for (auto _ : state) { + benchmark::DoNotOptimize(bench.run()); + cudaDeviceSynchronize(); + } + + double flops_per_itr = 2.0 * N * N * N; + 
state.counters["Flop/s"] + = benchmark::Counter(flops_per_itr, benchmark::Counter::kIsIterationInvariantRate); +} +BENCHMARK(BM_SM80_device_maximum_multiplies_ssrgemm_nt_n) + ->RangeMultiplier(2)->Range(256, 4096); + +/////////////////////////////////////////////////////////////////////////////// + +static void BM_SM80_device_maximum_multiplies_ssrgemm_nt_t(benchmark::State &state) { + const auto N = static_cast(state.range(0)); + using precision = float; + using OpClass = cutlass::arch::OpClassSimt; + using SmArch = cutlass::arch::Sm80; + + using AddOp = cuasr::maximum; + using MultOp = cuasr::multiplies; + + using Srgemm = cuasr::gemm::device::Srgemm< // + AddOp, MultOp, // + precision, cutlass::layout::ColumnMajor, // + precision, cutlass::layout::RowMajor, // + precision, cutlass::layout::RowMajor, // + precision, OpClass, SmArch>; + + // setup bench harness + cuasr::bench::device::BenchHarness bench({ N, N, N }); + + // benchmark loop + for (auto _ : state) { + benchmark::DoNotOptimize(bench.run()); + cudaDeviceSynchronize(); + } + + double flops_per_itr = 2.0 * N * N * N; + state.counters["Flop/s"] + = benchmark::Counter(flops_per_itr, benchmark::Counter::kIsIterationInvariantRate); +} +BENCHMARK(BM_SM80_device_maximum_multiplies_ssrgemm_nt_t) + ->RangeMultiplier(2)->Range(256, 4096); + +/////////////////////////////////////////////////////////////////////////////// + +static void BM_SM80_device_maximum_multiplies_ssrgemm_nn_n(benchmark::State &state) { + const auto N = static_cast(state.range(0)); + using precision = float; + using OpClass = cutlass::arch::OpClassSimt; + using SmArch = cutlass::arch::Sm80; + + using AddOp = cuasr::maximum; + using MultOp = cuasr::multiplies; + + using Srgemm = cuasr::gemm::device::Srgemm< // + AddOp, MultOp, // + precision, cutlass::layout::ColumnMajor, // + precision, cutlass::layout::ColumnMajor, // + precision, cutlass::layout::ColumnMajor, // + precision, OpClass, SmArch>; + + // setup bench harness + 
cuasr::bench::device::BenchHarness bench({ N, N, N }); + + // benchmark loop + for (auto _ : state) { + benchmark::DoNotOptimize(bench.run()); + cudaDeviceSynchronize(); + } + + double flops_per_itr = 2.0 * N * N * N; + state.counters["Flop/s"] + = benchmark::Counter(flops_per_itr, benchmark::Counter::kIsIterationInvariantRate); +} +BENCHMARK(BM_SM80_device_maximum_multiplies_ssrgemm_nn_n) + ->RangeMultiplier(2)->Range(256, 4096); + +/////////////////////////////////////////////////////////////////////////////// + +static void BM_SM80_device_maximum_multiplies_ssrgemm_nn_t(benchmark::State &state) { + const auto N = static_cast(state.range(0)); + using precision = float; + using OpClass = cutlass::arch::OpClassSimt; + using SmArch = cutlass::arch::Sm80; + + using AddOp = cuasr::maximum; + using MultOp = cuasr::multiplies; + + using Srgemm = cuasr::gemm::device::Srgemm< // + AddOp, MultOp, // + precision, cutlass::layout::ColumnMajor, // + precision, cutlass::layout::ColumnMajor, // + precision, cutlass::layout::RowMajor, // + precision, OpClass, SmArch>; + + // setup bench harness + cuasr::bench::device::BenchHarness bench({ N, N, N }); + + // benchmark loop + for (auto _ : state) { + benchmark::DoNotOptimize(bench.run()); + cudaDeviceSynchronize(); + } + + double flops_per_itr = 2.0 * N * N * N; + state.counters["Flop/s"] + = benchmark::Counter(flops_per_itr, benchmark::Counter::kIsIterationInvariantRate); +} +BENCHMARK(BM_SM80_device_maximum_multiplies_ssrgemm_nn_t) + ->RangeMultiplier(2)->Range(256, 4096); + +/////////////////////////////////////////////////////////////////////////////// + +static void BM_SM80_device_binary_or_binary_and_dsrgemm_tt_n(benchmark::State &state) { + const auto N = static_cast(state.range(0)); + using precision = double; + using OpClass = cutlass::arch::OpClassSimt; + using SmArch = cutlass::arch::Sm80; + + using AddOp = cuasr::binary_or; + using MultOp = cuasr::binary_and; + + using Srgemm = cuasr::gemm::device::Srgemm< // + AddOp, 
MultOp, // + precision, cutlass::layout::RowMajor, // + precision, cutlass::layout::RowMajor, // + precision, cutlass::layout::ColumnMajor, // + precision, OpClass, SmArch>; + + // setup bench harness + cuasr::bench::device::BenchHarness bench({ N, N, N }); + + // benchmark loop + for (auto _ : state) { + benchmark::DoNotOptimize(bench.run()); + cudaDeviceSynchronize(); + } + + double flops_per_itr = 2.0 * N * N * N; + state.counters["Flop/s"] + = benchmark::Counter(flops_per_itr, benchmark::Counter::kIsIterationInvariantRate); +} +BENCHMARK(BM_SM80_device_binary_or_binary_and_dsrgemm_tt_n) + ->RangeMultiplier(2)->Range(256, 4096); + +/////////////////////////////////////////////////////////////////////////////// + +static void BM_SM80_device_binary_or_binary_and_dsrgemm_tt_t(benchmark::State &state) { + const auto N = static_cast(state.range(0)); + using precision = double; + using OpClass = cutlass::arch::OpClassSimt; + using SmArch = cutlass::arch::Sm80; + + using AddOp = cuasr::binary_or; + using MultOp = cuasr::binary_and; + + using Srgemm = cuasr::gemm::device::Srgemm< // + AddOp, MultOp, // + precision, cutlass::layout::RowMajor, // + precision, cutlass::layout::RowMajor, // + precision, cutlass::layout::RowMajor, // + precision, OpClass, SmArch>; + + // setup bench harness + cuasr::bench::device::BenchHarness bench({ N, N, N }); + + // benchmark loop + for (auto _ : state) { + benchmark::DoNotOptimize(bench.run()); + cudaDeviceSynchronize(); + } + + double flops_per_itr = 2.0 * N * N * N; + state.counters["Flop/s"] + = benchmark::Counter(flops_per_itr, benchmark::Counter::kIsIterationInvariantRate); +} +BENCHMARK(BM_SM80_device_binary_or_binary_and_dsrgemm_tt_t) + ->RangeMultiplier(2)->Range(256, 4096); + +/////////////////////////////////////////////////////////////////////////////// + +static void BM_SM80_device_binary_or_binary_and_dsrgemm_tn_n(benchmark::State &state) { + const auto N = static_cast(state.range(0)); + using precision = double; + using 
OpClass = cutlass::arch::OpClassSimt; + using SmArch = cutlass::arch::Sm80; + + using AddOp = cuasr::binary_or; + using MultOp = cuasr::binary_and; + + using Srgemm = cuasr::gemm::device::Srgemm< // + AddOp, MultOp, // + precision, cutlass::layout::RowMajor, // + precision, cutlass::layout::ColumnMajor, // + precision, cutlass::layout::ColumnMajor, // + precision, OpClass, SmArch>; + + // setup bench harness + cuasr::bench::device::BenchHarness bench({ N, N, N }); + + // benchmark loop + for (auto _ : state) { + benchmark::DoNotOptimize(bench.run()); + cudaDeviceSynchronize(); + } + + double flops_per_itr = 2.0 * N * N * N; + state.counters["Flop/s"] + = benchmark::Counter(flops_per_itr, benchmark::Counter::kIsIterationInvariantRate); +} +BENCHMARK(BM_SM80_device_binary_or_binary_and_dsrgemm_tn_n) + ->RangeMultiplier(2)->Range(256, 4096); + +/////////////////////////////////////////////////////////////////////////////// + +static void BM_SM80_device_binary_or_binary_and_dsrgemm_tn_t(benchmark::State &state) { + const auto N = static_cast(state.range(0)); + using precision = double; + using OpClass = cutlass::arch::OpClassSimt; + using SmArch = cutlass::arch::Sm80; + + using AddOp = cuasr::binary_or; + using MultOp = cuasr::binary_and; + + using Srgemm = cuasr::gemm::device::Srgemm< // + AddOp, MultOp, // + precision, cutlass::layout::RowMajor, // + precision, cutlass::layout::ColumnMajor, // + precision, cutlass::layout::RowMajor, // + precision, OpClass, SmArch>; + + // setup bench harness + cuasr::bench::device::BenchHarness bench({ N, N, N }); + + // benchmark loop + for (auto _ : state) { + benchmark::DoNotOptimize(bench.run()); + cudaDeviceSynchronize(); + } + + double flops_per_itr = 2.0 * N * N * N; + state.counters["Flop/s"] + = benchmark::Counter(flops_per_itr, benchmark::Counter::kIsIterationInvariantRate); +} +BENCHMARK(BM_SM80_device_binary_or_binary_and_dsrgemm_tn_t) + ->RangeMultiplier(2)->Range(256, 4096); + 
+/////////////////////////////////////////////////////////////////////////////// + +static void BM_SM80_device_binary_or_binary_and_dsrgemm_nt_n(benchmark::State &state) { + const auto N = static_cast(state.range(0)); + using precision = double; + using OpClass = cutlass::arch::OpClassSimt; + using SmArch = cutlass::arch::Sm80; + + using AddOp = cuasr::binary_or; + using MultOp = cuasr::binary_and; + + using Srgemm = cuasr::gemm::device::Srgemm< // + AddOp, MultOp, // + precision, cutlass::layout::ColumnMajor, // + precision, cutlass::layout::RowMajor, // + precision, cutlass::layout::ColumnMajor, // + precision, OpClass, SmArch>; + + // setup bench harness + cuasr::bench::device::BenchHarness bench({ N, N, N }); + + // benchmark loop + for (auto _ : state) { + benchmark::DoNotOptimize(bench.run()); + cudaDeviceSynchronize(); + } + + double flops_per_itr = 2.0 * N * N * N; + state.counters["Flop/s"] + = benchmark::Counter(flops_per_itr, benchmark::Counter::kIsIterationInvariantRate); +} +BENCHMARK(BM_SM80_device_binary_or_binary_and_dsrgemm_nt_n) + ->RangeMultiplier(2)->Range(256, 4096); + +/////////////////////////////////////////////////////////////////////////////// + +static void BM_SM80_device_binary_or_binary_and_dsrgemm_nt_t(benchmark::State &state) { + const auto N = static_cast(state.range(0)); + using precision = double; + using OpClass = cutlass::arch::OpClassSimt; + using SmArch = cutlass::arch::Sm80; + + using AddOp = cuasr::binary_or; + using MultOp = cuasr::binary_and; + + using Srgemm = cuasr::gemm::device::Srgemm< // + AddOp, MultOp, // + precision, cutlass::layout::ColumnMajor, // + precision, cutlass::layout::RowMajor, // + precision, cutlass::layout::RowMajor, // + precision, OpClass, SmArch>; + + // setup bench harness + cuasr::bench::device::BenchHarness bench({ N, N, N }); + + // benchmark loop + for (auto _ : state) { + benchmark::DoNotOptimize(bench.run()); + cudaDeviceSynchronize(); + } + + double flops_per_itr = 2.0 * N * N * N; + 
state.counters["Flop/s"] + = benchmark::Counter(flops_per_itr, benchmark::Counter::kIsIterationInvariantRate); +} +BENCHMARK(BM_SM80_device_binary_or_binary_and_dsrgemm_nt_t) + ->RangeMultiplier(2)->Range(256, 4096); + +/////////////////////////////////////////////////////////////////////////////// + +static void BM_SM80_device_binary_or_binary_and_dsrgemm_nn_n(benchmark::State &state) { + const auto N = static_cast(state.range(0)); + using precision = double; + using OpClass = cutlass::arch::OpClassSimt; + using SmArch = cutlass::arch::Sm80; + + using AddOp = cuasr::binary_or; + using MultOp = cuasr::binary_and; + + using Srgemm = cuasr::gemm::device::Srgemm< // + AddOp, MultOp, // + precision, cutlass::layout::ColumnMajor, // + precision, cutlass::layout::ColumnMajor, // + precision, cutlass::layout::ColumnMajor, // + precision, OpClass, SmArch>; + + // setup bench harness + cuasr::bench::device::BenchHarness bench({ N, N, N }); + + // benchmark loop + for (auto _ : state) { + benchmark::DoNotOptimize(bench.run()); + cudaDeviceSynchronize(); + } + + double flops_per_itr = 2.0 * N * N * N; + state.counters["Flop/s"] + = benchmark::Counter(flops_per_itr, benchmark::Counter::kIsIterationInvariantRate); +} +BENCHMARK(BM_SM80_device_binary_or_binary_and_dsrgemm_nn_n) + ->RangeMultiplier(2)->Range(256, 4096); + +/////////////////////////////////////////////////////////////////////////////// + +static void BM_SM80_device_binary_or_binary_and_dsrgemm_nn_t(benchmark::State &state) { + const auto N = static_cast(state.range(0)); + using precision = double; + using OpClass = cutlass::arch::OpClassSimt; + using SmArch = cutlass::arch::Sm80; + + using AddOp = cuasr::binary_or; + using MultOp = cuasr::binary_and; + + using Srgemm = cuasr::gemm::device::Srgemm< // + AddOp, MultOp, // + precision, cutlass::layout::ColumnMajor, // + precision, cutlass::layout::ColumnMajor, // + precision, cutlass::layout::RowMajor, // + precision, OpClass, SmArch>; + + // setup bench harness + 
cuasr::bench::device::BenchHarness bench({ N, N, N }); + + // benchmark loop + for (auto _ : state) { + benchmark::DoNotOptimize(bench.run()); + cudaDeviceSynchronize(); + } + + double flops_per_itr = 2.0 * N * N * N; + state.counters["Flop/s"] + = benchmark::Counter(flops_per_itr, benchmark::Counter::kIsIterationInvariantRate); +} +BENCHMARK(BM_SM80_device_binary_or_binary_and_dsrgemm_nn_t) + ->RangeMultiplier(2)->Range(256, 4096); + +/////////////////////////////////////////////////////////////////////////////// + +static void BM_SM80_device_binary_or_binary_and_ssrgemm_tt_n(benchmark::State &state) { + const auto N = static_cast(state.range(0)); + using precision = float; + using OpClass = cutlass::arch::OpClassSimt; + using SmArch = cutlass::arch::Sm80; + + using AddOp = cuasr::binary_or; + using MultOp = cuasr::binary_and; + + using Srgemm = cuasr::gemm::device::Srgemm< // + AddOp, MultOp, // + precision, cutlass::layout::RowMajor, // + precision, cutlass::layout::RowMajor, // + precision, cutlass::layout::ColumnMajor, // + precision, OpClass, SmArch>; + + // setup bench harness + cuasr::bench::device::BenchHarness bench({ N, N, N }); + + // benchmark loop + for (auto _ : state) { + benchmark::DoNotOptimize(bench.run()); + cudaDeviceSynchronize(); + } + + double flops_per_itr = 2.0 * N * N * N; + state.counters["Flop/s"] + = benchmark::Counter(flops_per_itr, benchmark::Counter::kIsIterationInvariantRate); +} +BENCHMARK(BM_SM80_device_binary_or_binary_and_ssrgemm_tt_n) + ->RangeMultiplier(2)->Range(256, 4096); + +/////////////////////////////////////////////////////////////////////////////// + +static void BM_SM80_device_binary_or_binary_and_ssrgemm_tt_t(benchmark::State &state) { + const auto N = static_cast(state.range(0)); + using precision = float; + using OpClass = cutlass::arch::OpClassSimt; + using SmArch = cutlass::arch::Sm80; + + using AddOp = cuasr::binary_or; + using MultOp = cuasr::binary_and; + + using Srgemm = cuasr::gemm::device::Srgemm< // + 
AddOp, MultOp, // + precision, cutlass::layout::RowMajor, // + precision, cutlass::layout::RowMajor, // + precision, cutlass::layout::RowMajor, // + precision, OpClass, SmArch>; + + // setup bench harness + cuasr::bench::device::BenchHarness bench({ N, N, N }); + + // benchmark loop + for (auto _ : state) { + benchmark::DoNotOptimize(bench.run()); + cudaDeviceSynchronize(); + } + + double flops_per_itr = 2.0 * N * N * N; + state.counters["Flop/s"] + = benchmark::Counter(flops_per_itr, benchmark::Counter::kIsIterationInvariantRate); +} +BENCHMARK(BM_SM80_device_binary_or_binary_and_ssrgemm_tt_t) + ->RangeMultiplier(2)->Range(256, 4096); + +/////////////////////////////////////////////////////////////////////////////// + +static void BM_SM80_device_binary_or_binary_and_ssrgemm_tn_n(benchmark::State &state) { + const auto N = static_cast(state.range(0)); + using precision = float; + using OpClass = cutlass::arch::OpClassSimt; + using SmArch = cutlass::arch::Sm80; + + using AddOp = cuasr::binary_or; + using MultOp = cuasr::binary_and; + + using Srgemm = cuasr::gemm::device::Srgemm< // + AddOp, MultOp, // + precision, cutlass::layout::RowMajor, // + precision, cutlass::layout::ColumnMajor, // + precision, cutlass::layout::ColumnMajor, // + precision, OpClass, SmArch>; + + // setup bench harness + cuasr::bench::device::BenchHarness bench({ N, N, N }); + + // benchmark loop + for (auto _ : state) { + benchmark::DoNotOptimize(bench.run()); + cudaDeviceSynchronize(); + } + + double flops_per_itr = 2.0 * N * N * N; + state.counters["Flop/s"] + = benchmark::Counter(flops_per_itr, benchmark::Counter::kIsIterationInvariantRate); +} +BENCHMARK(BM_SM80_device_binary_or_binary_and_ssrgemm_tn_n) + ->RangeMultiplier(2)->Range(256, 4096); + +/////////////////////////////////////////////////////////////////////////////// + +static void BM_SM80_device_binary_or_binary_and_ssrgemm_tn_t(benchmark::State &state) { + const auto N = static_cast(state.range(0)); + using precision = float; + 
using OpClass = cutlass::arch::OpClassSimt; + using SmArch = cutlass::arch::Sm80; + + using AddOp = cuasr::binary_or; + using MultOp = cuasr::binary_and; + + using Srgemm = cuasr::gemm::device::Srgemm< // + AddOp, MultOp, // + precision, cutlass::layout::RowMajor, // + precision, cutlass::layout::ColumnMajor, // + precision, cutlass::layout::RowMajor, // + precision, OpClass, SmArch>; + + // setup bench harness + cuasr::bench::device::BenchHarness bench({ N, N, N }); + + // benchmark loop + for (auto _ : state) { + benchmark::DoNotOptimize(bench.run()); + cudaDeviceSynchronize(); + } + + double flops_per_itr = 2.0 * N * N * N; + state.counters["Flop/s"] + = benchmark::Counter(flops_per_itr, benchmark::Counter::kIsIterationInvariantRate); +} +BENCHMARK(BM_SM80_device_binary_or_binary_and_ssrgemm_tn_t) + ->RangeMultiplier(2)->Range(256, 4096); + +/////////////////////////////////////////////////////////////////////////////// + +static void BM_SM80_device_binary_or_binary_and_ssrgemm_nt_n(benchmark::State &state) { + const auto N = static_cast(state.range(0)); + using precision = float; + using OpClass = cutlass::arch::OpClassSimt; + using SmArch = cutlass::arch::Sm80; + + using AddOp = cuasr::binary_or; + using MultOp = cuasr::binary_and; + + using Srgemm = cuasr::gemm::device::Srgemm< // + AddOp, MultOp, // + precision, cutlass::layout::ColumnMajor, // + precision, cutlass::layout::RowMajor, // + precision, cutlass::layout::ColumnMajor, // + precision, OpClass, SmArch>; + + // setup bench harness + cuasr::bench::device::BenchHarness bench({ N, N, N }); + + // benchmark loop + for (auto _ : state) { + benchmark::DoNotOptimize(bench.run()); + cudaDeviceSynchronize(); + } + + double flops_per_itr = 2.0 * N * N * N; + state.counters["Flop/s"] + = benchmark::Counter(flops_per_itr, benchmark::Counter::kIsIterationInvariantRate); +} +BENCHMARK(BM_SM80_device_binary_or_binary_and_ssrgemm_nt_n) + ->RangeMultiplier(2)->Range(256, 4096); + 
+/////////////////////////////////////////////////////////////////////////////// + +static void BM_SM80_device_binary_or_binary_and_ssrgemm_nt_t(benchmark::State &state) { + const auto N = static_cast(state.range(0)); + using precision = float; + using OpClass = cutlass::arch::OpClassSimt; + using SmArch = cutlass::arch::Sm80; + + using AddOp = cuasr::binary_or; + using MultOp = cuasr::binary_and; + + using Srgemm = cuasr::gemm::device::Srgemm< // + AddOp, MultOp, // + precision, cutlass::layout::ColumnMajor, // + precision, cutlass::layout::RowMajor, // + precision, cutlass::layout::RowMajor, // + precision, OpClass, SmArch>; + + // setup bench harness + cuasr::bench::device::BenchHarness bench({ N, N, N }); + + // benchmark loop + for (auto _ : state) { + benchmark::DoNotOptimize(bench.run()); + cudaDeviceSynchronize(); + } + + double flops_per_itr = 2.0 * N * N * N; + state.counters["Flop/s"] + = benchmark::Counter(flops_per_itr, benchmark::Counter::kIsIterationInvariantRate); +} +BENCHMARK(BM_SM80_device_binary_or_binary_and_ssrgemm_nt_t) + ->RangeMultiplier(2)->Range(256, 4096); + +/////////////////////////////////////////////////////////////////////////////// + +static void BM_SM80_device_binary_or_binary_and_ssrgemm_nn_n(benchmark::State &state) { + const auto N = static_cast(state.range(0)); + using precision = float; + using OpClass = cutlass::arch::OpClassSimt; + using SmArch = cutlass::arch::Sm80; + + using AddOp = cuasr::binary_or; + using MultOp = cuasr::binary_and; + + using Srgemm = cuasr::gemm::device::Srgemm< // + AddOp, MultOp, // + precision, cutlass::layout::ColumnMajor, // + precision, cutlass::layout::ColumnMajor, // + precision, cutlass::layout::ColumnMajor, // + precision, OpClass, SmArch>; + + // setup bench harness + cuasr::bench::device::BenchHarness bench({ N, N, N }); + + // benchmark loop + for (auto _ : state) { + benchmark::DoNotOptimize(bench.run()); + cudaDeviceSynchronize(); + } + + double flops_per_itr = 2.0 * N * N * N; + 
state.counters["Flop/s"] + = benchmark::Counter(flops_per_itr, benchmark::Counter::kIsIterationInvariantRate); +} +BENCHMARK(BM_SM80_device_binary_or_binary_and_ssrgemm_nn_n) + ->RangeMultiplier(2)->Range(256, 4096); + +/////////////////////////////////////////////////////////////////////////////// + +static void BM_SM80_device_binary_or_binary_and_ssrgemm_nn_t(benchmark::State &state) { + const auto N = static_cast(state.range(0)); + using precision = float; + using OpClass = cutlass::arch::OpClassSimt; + using SmArch = cutlass::arch::Sm80; + + using AddOp = cuasr::binary_or; + using MultOp = cuasr::binary_and; + + using Srgemm = cuasr::gemm::device::Srgemm< // + AddOp, MultOp, // + precision, cutlass::layout::ColumnMajor, // + precision, cutlass::layout::ColumnMajor, // + precision, cutlass::layout::RowMajor, // + precision, OpClass, SmArch>; + + // setup bench harness + cuasr::bench::device::BenchHarness bench({ N, N, N }); + + // benchmark loop + for (auto _ : state) { + benchmark::DoNotOptimize(bench.run()); + cudaDeviceSynchronize(); + } + + double flops_per_itr = 2.0 * N * N * N; + state.counters["Flop/s"] + = benchmark::Counter(flops_per_itr, benchmark::Counter::kIsIterationInvariantRate); +} +BENCHMARK(BM_SM80_device_binary_or_binary_and_ssrgemm_nn_t) + ->RangeMultiplier(2)->Range(256, 4096); From bf1a4e20ef15ea5763a4d07eb6caeab95bfe05a7 Mon Sep 17 00:00:00 2001 From: Void Date: Wed, 3 Nov 2021 14:41:08 -0400 Subject: [PATCH 11/15] add default srgemm configs for SM80 and bind to multistage kernel --- .../device/default_srgemm_configuration.h | 32 ++++++++-------- include/cuasr/gemm/kernel/default_srgemm.h | 4 +- .../cuasr/gemm/threadblock/default_srmma.h | 8 +--- .../cuasr/gemm/threadblock/srmma_multistage.h | 38 +++++++++---------- 4 files changed, 38 insertions(+), 44 deletions(-) diff --git a/include/cuasr/gemm/device/default_srgemm_configuration.h b/include/cuasr/gemm/device/default_srgemm_configuration.h index 73665e1..b3f7317 100644 --- 
a/include/cuasr/gemm/device/default_srgemm_configuration.h +++ b/include/cuasr/gemm/device/default_srgemm_configuration.h @@ -295,8 +295,8 @@ struct DefaultSemiRingConfiguration< static int constexpr kAlignmentA = 1; static int constexpr kAlignmentB = 1; - using ThreadblockShape = cutlass::gemm::GemmShape<64, 128, 8>; - using WarpShape = cutlass::gemm::GemmShape<32, 64, 8>; + using ThreadblockShape = cutlass::gemm::GemmShape<64, 128, 16>; + using WarpShape = cutlass::gemm::GemmShape<32, 64, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; static int constexpr kStages = 3; @@ -322,8 +322,8 @@ struct DefaultSemiRingConfiguration< static int constexpr kAlignmentA = 1; static int constexpr kAlignmentB = 1; - using ThreadblockShape = cutlass::gemm::GemmShape<128, 128, 8>; - using WarpShape = cutlass::gemm::GemmShape<64, 32, 8>; + using ThreadblockShape = cutlass::gemm::GemmShape<64, 128, 16>; + using WarpShape = cutlass::gemm::GemmShape<32, 64, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; static int constexpr kStages = 3; @@ -349,8 +349,8 @@ struct DefaultSemiRingConfiguration< static int constexpr kAlignmentA = 1; static int constexpr kAlignmentB = 1; - using ThreadblockShape = cutlass::gemm::GemmShape<64, 128, 8>; - using WarpShape = cutlass::gemm::GemmShape<16, 64, 8>; + using ThreadblockShape = cutlass::gemm::GemmShape<64, 128, 16>; + using WarpShape = cutlass::gemm::GemmShape<32, 64, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; static int constexpr kStages = 3; @@ -375,8 +375,8 @@ struct DefaultSemiRingConfiguration< static int constexpr kAlignmentA = 1; static int constexpr kAlignmentB = 1; - using ThreadblockShape = cutlass::gemm::GemmShape<64, 128, 8>; - using WarpShape = cutlass::gemm::GemmShape<16, 64, 8>; + using ThreadblockShape = cutlass::gemm::GemmShape<64, 128, 16>; + using WarpShape = cutlass::gemm::GemmShape<32, 64, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; static int 
constexpr kStages = 3; @@ -401,8 +401,8 @@ struct DefaultSemiRingConfiguration< static int constexpr kAlignmentA = 1; static int constexpr kAlignmentB = 1; - using ThreadblockShape = cutlass::gemm::GemmShape<64, 128, 8>; - using WarpShape = cutlass::gemm::GemmShape<16, 64, 8>; + using ThreadblockShape = cutlass::gemm::GemmShape<64, 128, 16>; + using WarpShape = cutlass::gemm::GemmShape<32, 64, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; static int constexpr kStages = 3; @@ -427,8 +427,8 @@ struct DefaultSemiRingConfiguration< static int constexpr kAlignmentA = 1; static int constexpr kAlignmentB = 1; - using ThreadblockShape = cutlass::gemm::GemmShape<64, 128, 8>; - using WarpShape = cutlass::gemm::GemmShape<16, 64, 8>; + using ThreadblockShape = cutlass::gemm::GemmShape<64, 128, 16>; + using WarpShape = cutlass::gemm::GemmShape<32, 64, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; static int constexpr kStages = 3; @@ -453,8 +453,8 @@ struct DefaultSemiRingConfiguration< static int constexpr kAlignmentA = 1; static int constexpr kAlignmentB = 1; - using ThreadblockShape = cutlass::gemm::GemmShape<64, 128, 8>; - using WarpShape = cutlass::gemm::GemmShape<16, 64, 8>; + using ThreadblockShape = cutlass::gemm::GemmShape<64, 128, 16>; + using WarpShape = cutlass::gemm::GemmShape<32, 64, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; static int constexpr kStages = 3; @@ -479,8 +479,8 @@ struct DefaultSemiRingConfiguration< static int constexpr kAlignmentA = 1; static int constexpr kAlignmentB = 1; - using ThreadblockShape = cutlass::gemm::GemmShape<64, 128, 8>; - using WarpShape = cutlass::gemm::GemmShape<16, 64, 8>; + using ThreadblockShape = cutlass::gemm::GemmShape<64, 128, 16>; + using WarpShape = cutlass::gemm::GemmShape<32, 64, 16>; using InstructionShape = cutlass::gemm::GemmShape<1, 1, 1>; static int constexpr kStages = 3; diff --git a/include/cuasr/gemm/kernel/default_srgemm.h 
b/include/cuasr/gemm/kernel/default_srgemm.h index b85d2d9..8f7508d 100644 --- a/include/cuasr/gemm/kernel/default_srgemm.h +++ b/include/cuasr/gemm/kernel/default_srgemm.h @@ -105,8 +105,6 @@ template < typename ElementC, /// Element type for internal accumulation typename ElementAccumulator, - /// Tag indicating architecture to tune for - typename ArchTag, /// Threadblock-level tile size (concept: GemmShape) typename ThreadblockShape, /// Warp-level tile size (concept: GemmShape) @@ -133,7 +131,7 @@ struct DefaultSrgemm< cutlass::layout::RowMajor, ElementAccumulator, cutlass::arch::OpClassSimt, - ArchTag, + cutlass::arch::Sm50, ThreadblockShape, WarpShape, cutlass::gemm::GemmShape<1, 1, 1>, diff --git a/include/cuasr/gemm/threadblock/default_srmma.h b/include/cuasr/gemm/threadblock/default_srmma.h index 147a1b0..30e14c8 100644 --- a/include/cuasr/gemm/threadblock/default_srmma.h +++ b/include/cuasr/gemm/threadblock/default_srmma.h @@ -83,8 +83,6 @@ template < int kAlignmentB, /// Element type for internal accumulation typename ElementAccumulator, - /// Tag indicating architecture to tune for - typename ArchTag, /// Threadblock-level tile size (concept: GemmShape) typename ThreadblockShape, /// Warp-level tile size (concept: GemmShape) @@ -97,7 +95,7 @@ template < typename MultiplicationOp> struct DefaultSrmma { // Define the SrmmaCore components using SrmmaCore = typename cuasr::gemm::threadblock::DefaultSrmmaCore< @@ -142,8 +140,6 @@ template < int kAlignmentB, /// Element type for internal accumulation typename ElementAccumulator, - /// Tag indicating architecture to tune for - typename ArchTag, /// Threadblock-level tile size (concept: GemmShape) typename ThreadblockShape, /// Warp-level tile size (concept: GemmShape) @@ -159,7 +155,7 @@ template < struct DefaultSrmma { diff --git a/include/cuasr/gemm/threadblock/srmma_multistage.h b/include/cuasr/gemm/threadblock/srmma_multistage.h index dfea1d5..ae021ab 100644 --- 
a/include/cuasr/gemm/threadblock/srmma_multistage.h +++ b/include/cuasr/gemm/threadblock/srmma_multistage.h @@ -444,14 +444,14 @@ class SrmmaMultistage : warp_loaded_frag_B[0].fill(additive_identity_); warp_loaded_frag_B[1].fill(additive_identity_); - WarpTransformedFragmentA warp_transformed_frag_A[2]; - WarpTransformedFragmentB warp_transformed_frag_B[2]; + // WarpTransformedFragmentA warp_transformed_frag_A[2]; + // WarpTransformedFragmentB warp_transformed_frag_B[2]; // TODO: see if we can get away without this, should be possible - warp_transformed_frag_A[0].fill(additive_identity_); - warp_transformed_frag_A[1].fill(additive_identity_); - warp_transformed_frag_B[0].fill(additive_identity_); - warp_transformed_frag_B[1].fill(additive_identity_); + // warp_transformed_frag_A[0].fill(additive_identity_); + // warp_transformed_frag_A[1].fill(additive_identity_); + // warp_transformed_frag_B[0].fill(additive_identity_); + // warp_transformed_frag_B[1].fill(additive_identity_); Operator warp_mma; @@ -470,8 +470,8 @@ class SrmmaMultistage : int smem_write_stage_idx = Base::kStages - 1; int smem_read_stage_idx = 0; - warp_mma.transform(warp_transformed_frag_A[0], warp_transformed_frag_B[0], - warp_loaded_frag_A[0], warp_loaded_frag_B[0]); + // warp_mma.transform(warp_transformed_frag_A[0], warp_transformed_frag_B[0], + // warp_loaded_frag_A[0], warp_loaded_frag_B[0]); // // Mainloop @@ -502,15 +502,15 @@ class SrmmaMultistage : ++this->warp_tile_iterator_B_; if (warp_mma_k > 0) - warp_mma.transform(warp_transformed_frag_A[warp_mma_k % 2], - warp_transformed_frag_B[warp_mma_k % 2], - warp_loaded_frag_A[warp_mma_k % 2], - warp_loaded_frag_B[warp_mma_k % 2]); + // warp_mma.transform(warp_transformed_frag_A[warp_mma_k % 2], + // warp_transformed_frag_B[warp_mma_k % 2], + // warp_loaded_frag_A[warp_mma_k % 2], + // warp_loaded_frag_B[warp_mma_k % 2]); warp_mma( accum, - warp_transformed_frag_A[warp_mma_k % 2], - warp_transformed_frag_B[warp_mma_k % 2], + 
warp_loaded_frag_A[warp_mma_k % 2], + warp_loaded_frag_B[warp_mma_k % 2], accum ); @@ -579,11 +579,11 @@ class SrmmaMultistage : // Do any conversions feeding the first stage at the end of the loop so // we can start right away on mma instructions - if (warp_mma_k + 1 == Base::kWarpGemmIterations) - warp_mma.transform(warp_transformed_frag_A[(warp_mma_k + 1) % 2], - warp_transformed_frag_B[(warp_mma_k + 1) % 2], - warp_loaded_frag_A[(warp_mma_k + 1) % 2], - warp_loaded_frag_B[(warp_mma_k + 1) % 2]); + // if (warp_mma_k + 1 == Base::kWarpGemmIterations) + // warp_mma.transform(warp_transformed_frag_A[(warp_mma_k + 1) % 2], + // warp_transformed_frag_B[(warp_mma_k + 1) % 2], + // warp_loaded_frag_A[(warp_mma_k + 1) % 2], + // warp_loaded_frag_B[(warp_mma_k + 1) % 2]); } } From a7ba0cc55dd2a394a5891722cb8b16e155265b13 Mon Sep 17 00:00:00 2001 From: Void Date: Wed, 3 Nov 2021 14:41:25 -0400 Subject: [PATCH 12/15] change CMake default CUDA arch to SM80 --- CMakeLists.txt | 2 +- 1 file changed, 1 insertion(+), 1 deletion(-) diff --git a/CMakeLists.txt b/CMakeLists.txt index ae527f2..1f03d90 100644 --- a/CMakeLists.txt +++ b/CMakeLists.txt @@ -23,7 +23,7 @@ option(CUASR_BENCH "Build cuASR benchmark suite." ON) option(CUASR_EXAMPLE "Build cuASR examples." ON) # By default, build fat binaries. TODO add sm_80 here -option(CUASR_CUDA_ARCHS "List of CUDA architectures to compile for." "60 61 70 72 75") +option(CUASR_CUDA_ARCHS "List of CUDA architectures to compile for." 
"80") # CUDA native compiler (nvcc) only supports upto C++14 for now find_package(CUDA REQUIRED) From 62ae551b3421763b766679ac544fd179bbc3e3f5 Mon Sep 17 00:00:00 2001 From: Void Date: Thu, 11 Nov 2021 15:45:39 -0500 Subject: [PATCH 13/15] add default test generator, SM50 defualt tests --- test/device/CMakeLists.txt | 39 +- test/device/gen_defualt_test.py | 173 ++ test/device/sm50_defaults.cu | 2713 +++++++++++++++++++++++++++++++ 3 files changed, 2917 insertions(+), 8 deletions(-) create mode 100644 test/device/gen_defualt_test.py create mode 100644 test/device/sm50_defaults.cu diff --git a/test/device/CMakeLists.txt b/test/device/CMakeLists.txt index 328a9ea..ead4942 100644 --- a/test/device/CMakeLists.txt +++ b/test/device/CMakeLists.txt @@ -1,27 +1,50 @@ -file(GLOB SIMT_TEST_SRCS CONFIGURE_DEPENDS *.cu) -add_executable(cuasr_test_srgemm_device +# SM50 default tests +add_executable(cuasr_test_srgemm_device_sm50_defaults ${PROJECT_SOURCE_DIR}/test/harness.cpp - ${SIMT_TEST_SRCS} + sm50_defaults.cu ) target_include_directories( - cuasr_test_srgemm_device + cuasr_test_srgemm_device_sm50_defaults PRIVATE ${PROJECT_SOURCE_DIR}/include/ ${PROJECT_SOURCE_DIR}/tools/include/ ${PROJECT_SOURCE_DIR}/cutlass/include/ ${PROJECT_SOURCE_DIR}/cutlass/tools/util/include/ ) -target_link_libraries(cuasr_test_srgemm_device +target_link_libraries(cuasr_test_srgemm_device_sm50_defaults gtest ${cuASR_LIB_NAME} ) add_test( - NAME cuasr_test_srgemm_device - COMMAND cuasr_test_srgemm_device + NAME cuasr_test_srgemm_device_sm50_defaults + COMMAND cuasr_test_srgemm_device_sm50_defaults +) + +# SM50 all shmoo tests +file(GLOB SM50_SIMT_TEST_SRCS CONFIGURE_DEPENDS sm50_simt_*.cu) +add_executable(cuasr_test_srgemm_device_sm50_shmoo + ${PROJECT_SOURCE_DIR}/test/harness.cpp + ${SM50_SIMT_TEST_SRCS} +) +target_include_directories( + cuasr_test_srgemm_device_sm50_shmoo + PRIVATE + ${PROJECT_SOURCE_DIR}/include/ + ${PROJECT_SOURCE_DIR}/tools/include/ + ${PROJECT_SOURCE_DIR}/cutlass/include/ + 
${PROJECT_SOURCE_DIR}/cutlass/tools/util/include/ +) +target_link_libraries(cuasr_test_srgemm_device_sm50_shmoo + gtest + ${cuASR_LIB_NAME} +) +add_test( + NAME cuasr_test_srgemm_device_sm50_shmoo + COMMAND cuasr_test_srgemm_device_sm50_shmoo ) if(NOT DEFINED CUASR_TEST_LEVEL) set(CUASR_TEST_LEVEL 0) endif() -target_compile_definitions(cuasr_test_srgemm_device +target_compile_definitions(cuasr_test_srgemm_device_sm50_shmoo PRIVATE CUASR_TEST_LEVEL=${CUASR_TEST_LEVEL} ) diff --git a/test/device/gen_defualt_test.py b/test/device/gen_defualt_test.py new file mode 100644 index 0000000..97dd5d6 --- /dev/null +++ b/test/device/gen_defualt_test.py @@ -0,0 +1,173 @@ +import os +import sys +import argparse + +################################################################################ +# This file generates test cases for all default SRGEMM configurations. +################################################################################ + +precisions = [ + ["d", "double"], + ["s", "float"], +] + +transposes = [ + [False, False, True], + [False, False, False], + [False, True, True], + [False, True, False], + [True, False, True], + [True, False, False], + [True, True, True], + [True, True, False], +] + +semiring_operators = [ + ["plus", "multiplies"], # regular GEMM + ["minimum", "plus"], # min-plus (tropical) + ["maximum", "plus"], # max-plus + ["minimum", "maximum"], # min-max + ["maximum", "minimum"], # max-min + ["minimum", "multiplies"], # min-multiplies + ["maximum", "multiplies"], # max-multiplies + ["binary_or", "binary_and"] # or-and +] + + +testfile_header = """\ +/*************************************************************************************************** +* Copyright (c) 2021, Vijay Thakkar (thakkarv@gatech.edu). 
+**************************************************************************************************/ +///////////////////////////////////////////////////////////////// +// THIS TEST FILE IS GENERATED AUTOMATICALLY : DO NOT MODIFY // +///////////////////////////////////////////////////////////////// + +#include "gtest/gtest.h" + +/// from upstream cutlass +#include "cutlass/cutlass.h" +#include "cutlass/gemm/gemm.h" +#include "cutlass/gemm/threadblock/threadblock_swizzle.h" + +/// from cuasr lib +#include "cuasr/gemm/device/default_srgemm_configuration.h" +#include "cuasr/gemm/device/srgemm.h" +#include "cuasr/functional.h" + +/// from cuasr tools +#include "cuasr/reference/srgemm/host_srgemm.h" + +/// from local test dir +#include "testbed.h" + +""" + + +test_template = """\ + +/////////////////////////////////////////////////////////////////////////////// + +TEST(SM{sm_arch}_device_{add_op}_{mult_op}_{precision_char}srgemm_{transA}{transB}_{transC}, default) {{ + using precision = {precision_type}; + using OpClass = cutlass::arch::OpClassSimt; + using SmArch = cutlass::arch::Sm{sm_arch}; + + using AddOp = cuasr::{add_op}; + using MultOp = cuasr::{mult_op}; + + using Srgemm = cuasr::gemm::device::Srgemm< // + AddOp, MultOp, // + precision, cutlass::layout::{trans_typeA}Major, // + precision, cutlass::layout::{trans_typeB}Major, // + precision, cutlass::layout::{trans_typeC}Major, + precision, OpClass, SmArch>; + + EXPECT_TRUE(cuasr::test::gemm::device::TestAllGemm()); +}} + +""" + + +def write_test_file_header(testfile): + testfile.write(testfile_header) + + +def write_test_to_file( + testfile, + sm_arch, + add_op, + mult_op, + precision_char, + precision_type, + transA, + transB, + transC): + trans_typeA = "Column" if transA == "n" else "Row" + trans_typeB = "Column" if transB == "n" else "Row" + trans_typeC = "Column" if transC == "n" else "Row" + testfile.write(test_template.format( + sm_arch=sm_arch, + add_op=add_op, + mult_op=mult_op, + 
precision_char=precision_char, + precision_type=precision_type, + transA=transA, + transB=transB, + transC=transC, + trans_typeA=trans_typeA, + trans_typeB=trans_typeB, + trans_typeC=trans_typeC + )) + + +def main(args): + num_testes = 0 + testfile_name = "sm{}_defaults.cu".format(args.sm_arch) + print(testfile_name) + filePath = os.path.join(args.output_dir, testfile_name) + + # open file and gen all default tests + with open(filePath, "w") as testfile: + write_test_file_header(testfile) + + # for all semirings + for add_op, mult_op in semiring_operators: + # for all precisions + for precision in precisions: + precision_char = precision[0] + precision_type = precision[1] + + # transposes + for transpose in transposes: + # get transpose char + column_major_A = transpose[0] + column_major_B = transpose[1] + column_major_C = transpose[2] + transA = "n" if column_major_A else "t" + transB = "n" if column_major_B else "t" + transC = "n" if column_major_C else "t" + + # write to file + write_test_to_file( + testfile, + args.sm_arch, + add_op, + mult_op, + precision_char, + precision_type, + transA, + transB, + transC) + num_testes += 1 + print("Total test count per semi-ring = {}".format( + num_testes // len(semiring_operators))) + + +if __name__ == "__main__": + parser = argparse.ArgumentParser() + parser.add_argument("-o", "--output-dir", type=str, required=False, default=".", + help="Path to the output dir.") + parser.add_argument("-sm", "--sm-arch", type=int, required=False, default=50, choices=[50, 80], + help="SM architecture version number,") + args = parser.parse_args(sys.argv[1:]) + main(args) diff --git a/test/device/sm50_defaults.cu b/test/device/sm50_defaults.cu new file mode 100644 index 0000000..17c3e05 --- /dev/null +++ b/test/device/sm50_defaults.cu @@ -0,0 +1,2713 @@ +/*************************************************************************************************** +* Copyright (c) 2021, Vijay Thakkar (thakkarv@gatech.edu). 
+**************************************************************************************************/ +///////////////////////////////////////////////////////////////// +// THIS TEST FILE IS GENERATED AUTOMATICALLY : DO NOT MODIFY // +///////////////////////////////////////////////////////////////// + +#include "gtest/gtest.h" + +/// from upstream cutlass +#include "cutlass/cutlass.h" +#include "cutlass/gemm/gemm.h" +#include "cutlass/gemm/threadblock/threadblock_swizzle.h" + +/// from cuasr lib +#include "cuasr/gemm/device/default_srgemm_configuration.h" +#include "cuasr/gemm/device/srgemm.h" +#include "cuasr/functional.h" + +/// from cuasr tools +#include "cuasr/reference/srgemm/host_srgemm.h" + +/// from local test dir +#include "testbed.h" + + +/////////////////////////////////////////////////////////////////////////////// + +TEST(SM50_device_plus_multiplies_dsrgemm_tt_n, default) { + using precision = double; + using OpClass = cutlass::arch::OpClassSimt; + using SmArch = cutlass::arch::Sm50; + + using AddOp = cuasr::plus; + using MultOp = cuasr::multiplies; + + using Srgemm = cuasr::gemm::device::Srgemm< // + AddOp, MultOp, // + precision, cutlass::layout::RowMajor, // + precision, cutlass::layout::RowMajor, // + precision, cutlass::layout::ColumnMajor, + precision, OpClass, SmArch>; + + EXPECT_TRUE(cuasr::test::gemm::device::TestAllGemm()); +} + + +/////////////////////////////////////////////////////////////////////////////// + +TEST(SM50_device_plus_multiplies_dsrgemm_tt_t, default) { + using precision = double; + using OpClass = cutlass::arch::OpClassSimt; + using SmArch = cutlass::arch::Sm50; + + using AddOp = cuasr::plus; + using MultOp = cuasr::multiplies; + + using Srgemm = cuasr::gemm::device::Srgemm< // + AddOp, MultOp, // + precision, cutlass::layout::RowMajor, // + precision, cutlass::layout::RowMajor, // + precision, cutlass::layout::RowMajor, + precision, OpClass, SmArch>; + + EXPECT_TRUE(cuasr::test::gemm::device::TestAllGemm()); +} + + 
+/////////////////////////////////////////////////////////////////////////////// + +TEST(SM50_device_plus_multiplies_dsrgemm_tn_n, default) { + using precision = double; + using OpClass = cutlass::arch::OpClassSimt; + using SmArch = cutlass::arch::Sm50; + + using AddOp = cuasr::plus; + using MultOp = cuasr::multiplies; + + using Srgemm = cuasr::gemm::device::Srgemm< // + AddOp, MultOp, // + precision, cutlass::layout::RowMajor, // + precision, cutlass::layout::ColumnMajor, // + precision, cutlass::layout::ColumnMajor, + precision, OpClass, SmArch>; + + EXPECT_TRUE(cuasr::test::gemm::device::TestAllGemm()); +} + + +/////////////////////////////////////////////////////////////////////////////// + +TEST(SM50_device_plus_multiplies_dsrgemm_tn_t, default) { + using precision = double; + using OpClass = cutlass::arch::OpClassSimt; + using SmArch = cutlass::arch::Sm50; + + using AddOp = cuasr::plus; + using MultOp = cuasr::multiplies; + + using Srgemm = cuasr::gemm::device::Srgemm< // + AddOp, MultOp, // + precision, cutlass::layout::RowMajor, // + precision, cutlass::layout::ColumnMajor, // + precision, cutlass::layout::RowMajor, + precision, OpClass, SmArch>; + + EXPECT_TRUE(cuasr::test::gemm::device::TestAllGemm()); +} + + +/////////////////////////////////////////////////////////////////////////////// + +TEST(SM50_device_plus_multiplies_dsrgemm_nt_n, default) { + using precision = double; + using OpClass = cutlass::arch::OpClassSimt; + using SmArch = cutlass::arch::Sm50; + + using AddOp = cuasr::plus; + using MultOp = cuasr::multiplies; + + using Srgemm = cuasr::gemm::device::Srgemm< // + AddOp, MultOp, // + precision, cutlass::layout::ColumnMajor, // + precision, cutlass::layout::RowMajor, // + precision, cutlass::layout::ColumnMajor, + precision, OpClass, SmArch>; + + EXPECT_TRUE(cuasr::test::gemm::device::TestAllGemm()); +} + + +/////////////////////////////////////////////////////////////////////////////// + +TEST(SM50_device_plus_multiplies_dsrgemm_nt_t, default) 
{ + using precision = double; + using OpClass = cutlass::arch::OpClassSimt; + using SmArch = cutlass::arch::Sm50; + + using AddOp = cuasr::plus; + using MultOp = cuasr::multiplies; + + using Srgemm = cuasr::gemm::device::Srgemm< // + AddOp, MultOp, // + precision, cutlass::layout::ColumnMajor, // + precision, cutlass::layout::RowMajor, // + precision, cutlass::layout::RowMajor, + precision, OpClass, SmArch>; + + EXPECT_TRUE(cuasr::test::gemm::device::TestAllGemm()); +} + + +/////////////////////////////////////////////////////////////////////////////// + +TEST(SM50_device_plus_multiplies_dsrgemm_nn_n, default) { + using precision = double; + using OpClass = cutlass::arch::OpClassSimt; + using SmArch = cutlass::arch::Sm50; + + using AddOp = cuasr::plus; + using MultOp = cuasr::multiplies; + + using Srgemm = cuasr::gemm::device::Srgemm< // + AddOp, MultOp, // + precision, cutlass::layout::ColumnMajor, // + precision, cutlass::layout::ColumnMajor, // + precision, cutlass::layout::ColumnMajor, + precision, OpClass, SmArch>; + + EXPECT_TRUE(cuasr::test::gemm::device::TestAllGemm()); +} + + +/////////////////////////////////////////////////////////////////////////////// + +TEST(SM50_device_plus_multiplies_dsrgemm_nn_t, default) { + using precision = double; + using OpClass = cutlass::arch::OpClassSimt; + using SmArch = cutlass::arch::Sm50; + + using AddOp = cuasr::plus; + using MultOp = cuasr::multiplies; + + using Srgemm = cuasr::gemm::device::Srgemm< // + AddOp, MultOp, // + precision, cutlass::layout::ColumnMajor, // + precision, cutlass::layout::ColumnMajor, // + precision, cutlass::layout::RowMajor, + precision, OpClass, SmArch>; + + EXPECT_TRUE(cuasr::test::gemm::device::TestAllGemm()); +} + + +/////////////////////////////////////////////////////////////////////////////// + +TEST(SM50_device_plus_multiplies_ssrgemm_tt_n, default) { + using precision = float; + using OpClass = cutlass::arch::OpClassSimt; + using SmArch = cutlass::arch::Sm50; + + using AddOp = 
cuasr::plus; + using MultOp = cuasr::multiplies; + + using Srgemm = cuasr::gemm::device::Srgemm< // + AddOp, MultOp, // + precision, cutlass::layout::RowMajor, // + precision, cutlass::layout::RowMajor, // + precision, cutlass::layout::ColumnMajor, + precision, OpClass, SmArch>; + + EXPECT_TRUE(cuasr::test::gemm::device::TestAllGemm()); +} + + +/////////////////////////////////////////////////////////////////////////////// + +TEST(SM50_device_plus_multiplies_ssrgemm_tt_t, default) { + using precision = float; + using OpClass = cutlass::arch::OpClassSimt; + using SmArch = cutlass::arch::Sm50; + + using AddOp = cuasr::plus; + using MultOp = cuasr::multiplies; + + using Srgemm = cuasr::gemm::device::Srgemm< // + AddOp, MultOp, // + precision, cutlass::layout::RowMajor, // + precision, cutlass::layout::RowMajor, // + precision, cutlass::layout::RowMajor, + precision, OpClass, SmArch>; + + EXPECT_TRUE(cuasr::test::gemm::device::TestAllGemm()); +} + + +/////////////////////////////////////////////////////////////////////////////// + +TEST(SM50_device_plus_multiplies_ssrgemm_tn_n, default) { + using precision = float; + using OpClass = cutlass::arch::OpClassSimt; + using SmArch = cutlass::arch::Sm50; + + using AddOp = cuasr::plus; + using MultOp = cuasr::multiplies; + + using Srgemm = cuasr::gemm::device::Srgemm< // + AddOp, MultOp, // + precision, cutlass::layout::RowMajor, // + precision, cutlass::layout::ColumnMajor, // + precision, cutlass::layout::ColumnMajor, + precision, OpClass, SmArch>; + + EXPECT_TRUE(cuasr::test::gemm::device::TestAllGemm()); +} + + +/////////////////////////////////////////////////////////////////////////////// + +TEST(SM50_device_plus_multiplies_ssrgemm_tn_t, default) { + using precision = float; + using OpClass = cutlass::arch::OpClassSimt; + using SmArch = cutlass::arch::Sm50; + + using AddOp = cuasr::plus; + using MultOp = cuasr::multiplies; + + using Srgemm = cuasr::gemm::device::Srgemm< // + AddOp, MultOp, // + precision, 
cutlass::layout::RowMajor, // + precision, cutlass::layout::ColumnMajor, // + precision, cutlass::layout::RowMajor, + precision, OpClass, SmArch>; + + EXPECT_TRUE(cuasr::test::gemm::device::TestAllGemm()); +} + + +/////////////////////////////////////////////////////////////////////////////// + +TEST(SM50_device_plus_multiplies_ssrgemm_nt_n, default) { + using precision = float; + using OpClass = cutlass::arch::OpClassSimt; + using SmArch = cutlass::arch::Sm50; + + using AddOp = cuasr::plus; + using MultOp = cuasr::multiplies; + + using Srgemm = cuasr::gemm::device::Srgemm< // + AddOp, MultOp, // + precision, cutlass::layout::ColumnMajor, // + precision, cutlass::layout::RowMajor, // + precision, cutlass::layout::ColumnMajor, + precision, OpClass, SmArch>; + + EXPECT_TRUE(cuasr::test::gemm::device::TestAllGemm()); +} + + +/////////////////////////////////////////////////////////////////////////////// + +TEST(SM50_device_plus_multiplies_ssrgemm_nt_t, default) { + using precision = float; + using OpClass = cutlass::arch::OpClassSimt; + using SmArch = cutlass::arch::Sm50; + + using AddOp = cuasr::plus; + using MultOp = cuasr::multiplies; + + using Srgemm = cuasr::gemm::device::Srgemm< // + AddOp, MultOp, // + precision, cutlass::layout::ColumnMajor, // + precision, cutlass::layout::RowMajor, // + precision, cutlass::layout::RowMajor, + precision, OpClass, SmArch>; + + EXPECT_TRUE(cuasr::test::gemm::device::TestAllGemm()); +} + + +/////////////////////////////////////////////////////////////////////////////// + +TEST(SM50_device_plus_multiplies_ssrgemm_nn_n, default) { + using precision = float; + using OpClass = cutlass::arch::OpClassSimt; + using SmArch = cutlass::arch::Sm50; + + using AddOp = cuasr::plus; + using MultOp = cuasr::multiplies; + + using Srgemm = cuasr::gemm::device::Srgemm< // + AddOp, MultOp, // + precision, cutlass::layout::ColumnMajor, // + precision, cutlass::layout::ColumnMajor, // + precision, cutlass::layout::ColumnMajor, + precision, OpClass, 
SmArch>; + + EXPECT_TRUE(cuasr::test::gemm::device::TestAllGemm()); +} + + +/////////////////////////////////////////////////////////////////////////////// + +TEST(SM50_device_plus_multiplies_ssrgemm_nn_t, default) { + using precision = float; + using OpClass = cutlass::arch::OpClassSimt; + using SmArch = cutlass::arch::Sm50; + + using AddOp = cuasr::plus; + using MultOp = cuasr::multiplies; + + using Srgemm = cuasr::gemm::device::Srgemm< // + AddOp, MultOp, // + precision, cutlass::layout::ColumnMajor, // + precision, cutlass::layout::ColumnMajor, // + precision, cutlass::layout::RowMajor, + precision, OpClass, SmArch>; + + EXPECT_TRUE(cuasr::test::gemm::device::TestAllGemm()); +} + + +/////////////////////////////////////////////////////////////////////////////// + +TEST(SM50_device_minimum_plus_dsrgemm_tt_n, default) { + using precision = double; + using OpClass = cutlass::arch::OpClassSimt; + using SmArch = cutlass::arch::Sm50; + + using AddOp = cuasr::minimum; + using MultOp = cuasr::plus; + + using Srgemm = cuasr::gemm::device::Srgemm< // + AddOp, MultOp, // + precision, cutlass::layout::RowMajor, // + precision, cutlass::layout::RowMajor, // + precision, cutlass::layout::ColumnMajor, + precision, OpClass, SmArch>; + + EXPECT_TRUE(cuasr::test::gemm::device::TestAllGemm()); +} + + +/////////////////////////////////////////////////////////////////////////////// + +TEST(SM50_device_minimum_plus_dsrgemm_tt_t, default) { + using precision = double; + using OpClass = cutlass::arch::OpClassSimt; + using SmArch = cutlass::arch::Sm50; + + using AddOp = cuasr::minimum; + using MultOp = cuasr::plus; + + using Srgemm = cuasr::gemm::device::Srgemm< // + AddOp, MultOp, // + precision, cutlass::layout::RowMajor, // + precision, cutlass::layout::RowMajor, // + precision, cutlass::layout::RowMajor, + precision, OpClass, SmArch>; + + EXPECT_TRUE(cuasr::test::gemm::device::TestAllGemm()); +} + + +/////////////////////////////////////////////////////////////////////////////// + 
+TEST(SM50_device_minimum_plus_dsrgemm_tn_n, default) { + using precision = double; + using OpClass = cutlass::arch::OpClassSimt; + using SmArch = cutlass::arch::Sm50; + + using AddOp = cuasr::minimum; + using MultOp = cuasr::plus; + + using Srgemm = cuasr::gemm::device::Srgemm< // + AddOp, MultOp, // + precision, cutlass::layout::RowMajor, // + precision, cutlass::layout::ColumnMajor, // + precision, cutlass::layout::ColumnMajor, + precision, OpClass, SmArch>; + + EXPECT_TRUE(cuasr::test::gemm::device::TestAllGemm()); +} + + +/////////////////////////////////////////////////////////////////////////////// + +TEST(SM50_device_minimum_plus_dsrgemm_tn_t, default) { + using precision = double; + using OpClass = cutlass::arch::OpClassSimt; + using SmArch = cutlass::arch::Sm50; + + using AddOp = cuasr::minimum; + using MultOp = cuasr::plus; + + using Srgemm = cuasr::gemm::device::Srgemm< // + AddOp, MultOp, // + precision, cutlass::layout::RowMajor, // + precision, cutlass::layout::ColumnMajor, // + precision, cutlass::layout::RowMajor, + precision, OpClass, SmArch>; + + EXPECT_TRUE(cuasr::test::gemm::device::TestAllGemm()); +} + + +/////////////////////////////////////////////////////////////////////////////// + +TEST(SM50_device_minimum_plus_dsrgemm_nt_n, default) { + using precision = double; + using OpClass = cutlass::arch::OpClassSimt; + using SmArch = cutlass::arch::Sm50; + + using AddOp = cuasr::minimum; + using MultOp = cuasr::plus; + + using Srgemm = cuasr::gemm::device::Srgemm< // + AddOp, MultOp, // + precision, cutlass::layout::ColumnMajor, // + precision, cutlass::layout::RowMajor, // + precision, cutlass::layout::ColumnMajor, + precision, OpClass, SmArch>; + + EXPECT_TRUE(cuasr::test::gemm::device::TestAllGemm()); +} + + +/////////////////////////////////////////////////////////////////////////////// + +TEST(SM50_device_minimum_plus_dsrgemm_nt_t, default) { + using precision = double; + using OpClass = cutlass::arch::OpClassSimt; + using SmArch = 
cutlass::arch::Sm50; + + using AddOp = cuasr::minimum; + using MultOp = cuasr::plus; + + using Srgemm = cuasr::gemm::device::Srgemm< // + AddOp, MultOp, // + precision, cutlass::layout::ColumnMajor, // + precision, cutlass::layout::RowMajor, // + precision, cutlass::layout::RowMajor, + precision, OpClass, SmArch>; + + EXPECT_TRUE(cuasr::test::gemm::device::TestAllGemm()); +} + + +/////////////////////////////////////////////////////////////////////////////// + +TEST(SM50_device_minimum_plus_dsrgemm_nn_n, default) { + using precision = double; + using OpClass = cutlass::arch::OpClassSimt; + using SmArch = cutlass::arch::Sm50; + + using AddOp = cuasr::minimum; + using MultOp = cuasr::plus; + + using Srgemm = cuasr::gemm::device::Srgemm< // + AddOp, MultOp, // + precision, cutlass::layout::ColumnMajor, // + precision, cutlass::layout::ColumnMajor, // + precision, cutlass::layout::ColumnMajor, + precision, OpClass, SmArch>; + + EXPECT_TRUE(cuasr::test::gemm::device::TestAllGemm()); +} + + +/////////////////////////////////////////////////////////////////////////////// + +TEST(SM50_device_minimum_plus_dsrgemm_nn_t, default) { + using precision = double; + using OpClass = cutlass::arch::OpClassSimt; + using SmArch = cutlass::arch::Sm50; + + using AddOp = cuasr::minimum; + using MultOp = cuasr::plus; + + using Srgemm = cuasr::gemm::device::Srgemm< // + AddOp, MultOp, // + precision, cutlass::layout::ColumnMajor, // + precision, cutlass::layout::ColumnMajor, // + precision, cutlass::layout::RowMajor, + precision, OpClass, SmArch>; + + EXPECT_TRUE(cuasr::test::gemm::device::TestAllGemm()); +} + + +/////////////////////////////////////////////////////////////////////////////// + +TEST(SM50_device_minimum_plus_ssrgemm_tt_n, default) { + using precision = float; + using OpClass = cutlass::arch::OpClassSimt; + using SmArch = cutlass::arch::Sm50; + + using AddOp = cuasr::minimum; + using MultOp = cuasr::plus; + + using Srgemm = cuasr::gemm::device::Srgemm< // + AddOp, MultOp, // 
+ precision, cutlass::layout::RowMajor, // + precision, cutlass::layout::RowMajor, // + precision, cutlass::layout::ColumnMajor, + precision, OpClass, SmArch>; + + EXPECT_TRUE(cuasr::test::gemm::device::TestAllGemm()); +} + + +/////////////////////////////////////////////////////////////////////////////// + +TEST(SM50_device_minimum_plus_ssrgemm_tt_t, default) { + using precision = float; + using OpClass = cutlass::arch::OpClassSimt; + using SmArch = cutlass::arch::Sm50; + + using AddOp = cuasr::minimum; + using MultOp = cuasr::plus; + + using Srgemm = cuasr::gemm::device::Srgemm< // + AddOp, MultOp, // + precision, cutlass::layout::RowMajor, // + precision, cutlass::layout::RowMajor, // + precision, cutlass::layout::RowMajor, + precision, OpClass, SmArch>; + + EXPECT_TRUE(cuasr::test::gemm::device::TestAllGemm()); +} + + +/////////////////////////////////////////////////////////////////////////////// + +TEST(SM50_device_minimum_plus_ssrgemm_tn_n, default) { + using precision = float; + using OpClass = cutlass::arch::OpClassSimt; + using SmArch = cutlass::arch::Sm50; + + using AddOp = cuasr::minimum; + using MultOp = cuasr::plus; + + using Srgemm = cuasr::gemm::device::Srgemm< // + AddOp, MultOp, // + precision, cutlass::layout::RowMajor, // + precision, cutlass::layout::ColumnMajor, // + precision, cutlass::layout::ColumnMajor, + precision, OpClass, SmArch>; + + EXPECT_TRUE(cuasr::test::gemm::device::TestAllGemm()); +} + + +/////////////////////////////////////////////////////////////////////////////// + +TEST(SM50_device_minimum_plus_ssrgemm_tn_t, default) { + using precision = float; + using OpClass = cutlass::arch::OpClassSimt; + using SmArch = cutlass::arch::Sm50; + + using AddOp = cuasr::minimum; + using MultOp = cuasr::plus; + + using Srgemm = cuasr::gemm::device::Srgemm< // + AddOp, MultOp, // + precision, cutlass::layout::RowMajor, // + precision, cutlass::layout::ColumnMajor, // + precision, cutlass::layout::RowMajor, + precision, OpClass, SmArch>; + + 
EXPECT_TRUE(cuasr::test::gemm::device::TestAllGemm()); +} + + +/////////////////////////////////////////////////////////////////////////////// + +TEST(SM50_device_minimum_plus_ssrgemm_nt_n, default) { + using precision = float; + using OpClass = cutlass::arch::OpClassSimt; + using SmArch = cutlass::arch::Sm50; + + using AddOp = cuasr::minimum; + using MultOp = cuasr::plus; + + using Srgemm = cuasr::gemm::device::Srgemm< // + AddOp, MultOp, // + precision, cutlass::layout::ColumnMajor, // + precision, cutlass::layout::RowMajor, // + precision, cutlass::layout::ColumnMajor, + precision, OpClass, SmArch>; + + EXPECT_TRUE(cuasr::test::gemm::device::TestAllGemm()); +} + + +/////////////////////////////////////////////////////////////////////////////// + +TEST(SM50_device_minimum_plus_ssrgemm_nt_t, default) { + using precision = float; + using OpClass = cutlass::arch::OpClassSimt; + using SmArch = cutlass::arch::Sm50; + + using AddOp = cuasr::minimum; + using MultOp = cuasr::plus; + + using Srgemm = cuasr::gemm::device::Srgemm< // + AddOp, MultOp, // + precision, cutlass::layout::ColumnMajor, // + precision, cutlass::layout::RowMajor, // + precision, cutlass::layout::RowMajor, + precision, OpClass, SmArch>; + + EXPECT_TRUE(cuasr::test::gemm::device::TestAllGemm()); +} + + +/////////////////////////////////////////////////////////////////////////////// + +TEST(SM50_device_minimum_plus_ssrgemm_nn_n, default) { + using precision = float; + using OpClass = cutlass::arch::OpClassSimt; + using SmArch = cutlass::arch::Sm50; + + using AddOp = cuasr::minimum; + using MultOp = cuasr::plus; + + using Srgemm = cuasr::gemm::device::Srgemm< // + AddOp, MultOp, // + precision, cutlass::layout::ColumnMajor, // + precision, cutlass::layout::ColumnMajor, // + precision, cutlass::layout::ColumnMajor, + precision, OpClass, SmArch>; + + EXPECT_TRUE(cuasr::test::gemm::device::TestAllGemm()); +} + + +/////////////////////////////////////////////////////////////////////////////// + 
+TEST(SM50_device_minimum_plus_ssrgemm_nn_t, default) { + using precision = float; + using OpClass = cutlass::arch::OpClassSimt; + using SmArch = cutlass::arch::Sm50; + + using AddOp = cuasr::minimum; + using MultOp = cuasr::plus; + + using Srgemm = cuasr::gemm::device::Srgemm< // + AddOp, MultOp, // + precision, cutlass::layout::ColumnMajor, // + precision, cutlass::layout::ColumnMajor, // + precision, cutlass::layout::RowMajor, + precision, OpClass, SmArch>; + + EXPECT_TRUE(cuasr::test::gemm::device::TestAllGemm()); +} + + +/////////////////////////////////////////////////////////////////////////////// + +TEST(SM50_device_maximum_plus_dsrgemm_tt_n, default) { + using precision = double; + using OpClass = cutlass::arch::OpClassSimt; + using SmArch = cutlass::arch::Sm50; + + using AddOp = cuasr::maximum; + using MultOp = cuasr::plus; + + using Srgemm = cuasr::gemm::device::Srgemm< // + AddOp, MultOp, // + precision, cutlass::layout::RowMajor, // + precision, cutlass::layout::RowMajor, // + precision, cutlass::layout::ColumnMajor, + precision, OpClass, SmArch>; + + EXPECT_TRUE(cuasr::test::gemm::device::TestAllGemm()); +} + + +/////////////////////////////////////////////////////////////////////////////// + +TEST(SM50_device_maximum_plus_dsrgemm_tt_t, default) { + using precision = double; + using OpClass = cutlass::arch::OpClassSimt; + using SmArch = cutlass::arch::Sm50; + + using AddOp = cuasr::maximum; + using MultOp = cuasr::plus; + + using Srgemm = cuasr::gemm::device::Srgemm< // + AddOp, MultOp, // + precision, cutlass::layout::RowMajor, // + precision, cutlass::layout::RowMajor, // + precision, cutlass::layout::RowMajor, + precision, OpClass, SmArch>; + + EXPECT_TRUE(cuasr::test::gemm::device::TestAllGemm()); +} + + +/////////////////////////////////////////////////////////////////////////////// + +TEST(SM50_device_maximum_plus_dsrgemm_tn_n, default) { + using precision = double; + using OpClass = cutlass::arch::OpClassSimt; + using SmArch = 
cutlass::arch::Sm50; + + using AddOp = cuasr::maximum; + using MultOp = cuasr::plus; + + using Srgemm = cuasr::gemm::device::Srgemm< // + AddOp, MultOp, // + precision, cutlass::layout::RowMajor, // + precision, cutlass::layout::ColumnMajor, // + precision, cutlass::layout::ColumnMajor, + precision, OpClass, SmArch>; + + EXPECT_TRUE(cuasr::test::gemm::device::TestAllGemm()); +} + + +/////////////////////////////////////////////////////////////////////////////// + +TEST(SM50_device_maximum_plus_dsrgemm_tn_t, default) { + using precision = double; + using OpClass = cutlass::arch::OpClassSimt; + using SmArch = cutlass::arch::Sm50; + + using AddOp = cuasr::maximum; + using MultOp = cuasr::plus; + + using Srgemm = cuasr::gemm::device::Srgemm< // + AddOp, MultOp, // + precision, cutlass::layout::RowMajor, // + precision, cutlass::layout::ColumnMajor, // + precision, cutlass::layout::RowMajor, + precision, OpClass, SmArch>; + + EXPECT_TRUE(cuasr::test::gemm::device::TestAllGemm()); +} + + +/////////////////////////////////////////////////////////////////////////////// + +TEST(SM50_device_maximum_plus_dsrgemm_nt_n, default) { + using precision = double; + using OpClass = cutlass::arch::OpClassSimt; + using SmArch = cutlass::arch::Sm50; + + using AddOp = cuasr::maximum; + using MultOp = cuasr::plus; + + using Srgemm = cuasr::gemm::device::Srgemm< // + AddOp, MultOp, // + precision, cutlass::layout::ColumnMajor, // + precision, cutlass::layout::RowMajor, // + precision, cutlass::layout::ColumnMajor, + precision, OpClass, SmArch>; + + EXPECT_TRUE(cuasr::test::gemm::device::TestAllGemm()); +} + + +/////////////////////////////////////////////////////////////////////////////// + +TEST(SM50_device_maximum_plus_dsrgemm_nt_t, default) { + using precision = double; + using OpClass = cutlass::arch::OpClassSimt; + using SmArch = cutlass::arch::Sm50; + + using AddOp = cuasr::maximum; + using MultOp = cuasr::plus; + + using Srgemm = cuasr::gemm::device::Srgemm< // + AddOp, MultOp, // + 
precision, cutlass::layout::ColumnMajor, // + precision, cutlass::layout::RowMajor, // + precision, cutlass::layout::RowMajor, + precision, OpClass, SmArch>; + + EXPECT_TRUE(cuasr::test::gemm::device::TestAllGemm()); +} + + +/////////////////////////////////////////////////////////////////////////////// + +TEST(SM50_device_maximum_plus_dsrgemm_nn_n, default) { + using precision = double; + using OpClass = cutlass::arch::OpClassSimt; + using SmArch = cutlass::arch::Sm50; + + using AddOp = cuasr::maximum; + using MultOp = cuasr::plus; + + using Srgemm = cuasr::gemm::device::Srgemm< // + AddOp, MultOp, // + precision, cutlass::layout::ColumnMajor, // + precision, cutlass::layout::ColumnMajor, // + precision, cutlass::layout::ColumnMajor, + precision, OpClass, SmArch>; + + EXPECT_TRUE(cuasr::test::gemm::device::TestAllGemm()); +} + + +/////////////////////////////////////////////////////////////////////////////// + +TEST(SM50_device_maximum_plus_dsrgemm_nn_t, default) { + using precision = double; + using OpClass = cutlass::arch::OpClassSimt; + using SmArch = cutlass::arch::Sm50; + + using AddOp = cuasr::maximum; + using MultOp = cuasr::plus; + + using Srgemm = cuasr::gemm::device::Srgemm< // + AddOp, MultOp, // + precision, cutlass::layout::ColumnMajor, // + precision, cutlass::layout::ColumnMajor, // + precision, cutlass::layout::RowMajor, + precision, OpClass, SmArch>; + + EXPECT_TRUE(cuasr::test::gemm::device::TestAllGemm()); +} + + +/////////////////////////////////////////////////////////////////////////////// + +TEST(SM50_device_maximum_plus_ssrgemm_tt_n, default) { + using precision = float; + using OpClass = cutlass::arch::OpClassSimt; + using SmArch = cutlass::arch::Sm50; + + using AddOp = cuasr::maximum; + using MultOp = cuasr::plus; + + using Srgemm = cuasr::gemm::device::Srgemm< // + AddOp, MultOp, // + precision, cutlass::layout::RowMajor, // + precision, cutlass::layout::RowMajor, // + precision, cutlass::layout::ColumnMajor, + precision, OpClass, 
SmArch>; + + EXPECT_TRUE(cuasr::test::gemm::device::TestAllGemm()); +} + + +/////////////////////////////////////////////////////////////////////////////// + +TEST(SM50_device_maximum_plus_ssrgemm_tt_t, default) { + using precision = float; + using OpClass = cutlass::arch::OpClassSimt; + using SmArch = cutlass::arch::Sm50; + + using AddOp = cuasr::maximum; + using MultOp = cuasr::plus; + + using Srgemm = cuasr::gemm::device::Srgemm< // + AddOp, MultOp, // + precision, cutlass::layout::RowMajor, // + precision, cutlass::layout::RowMajor, // + precision, cutlass::layout::RowMajor, + precision, OpClass, SmArch>; + + EXPECT_TRUE(cuasr::test::gemm::device::TestAllGemm()); +} + + +/////////////////////////////////////////////////////////////////////////////// + +TEST(SM50_device_maximum_plus_ssrgemm_tn_n, default) { + using precision = float; + using OpClass = cutlass::arch::OpClassSimt; + using SmArch = cutlass::arch::Sm50; + + using AddOp = cuasr::maximum; + using MultOp = cuasr::plus; + + using Srgemm = cuasr::gemm::device::Srgemm< // + AddOp, MultOp, // + precision, cutlass::layout::RowMajor, // + precision, cutlass::layout::ColumnMajor, // + precision, cutlass::layout::ColumnMajor, + precision, OpClass, SmArch>; + + EXPECT_TRUE(cuasr::test::gemm::device::TestAllGemm()); +} + + +/////////////////////////////////////////////////////////////////////////////// + +TEST(SM50_device_maximum_plus_ssrgemm_tn_t, default) { + using precision = float; + using OpClass = cutlass::arch::OpClassSimt; + using SmArch = cutlass::arch::Sm50; + + using AddOp = cuasr::maximum; + using MultOp = cuasr::plus; + + using Srgemm = cuasr::gemm::device::Srgemm< // + AddOp, MultOp, // + precision, cutlass::layout::RowMajor, // + precision, cutlass::layout::ColumnMajor, // + precision, cutlass::layout::RowMajor, + precision, OpClass, SmArch>; + + EXPECT_TRUE(cuasr::test::gemm::device::TestAllGemm()); +} + + +/////////////////////////////////////////////////////////////////////////////// + 
+TEST(SM50_device_maximum_plus_ssrgemm_nt_n, default) { + using precision = float; + using OpClass = cutlass::arch::OpClassSimt; + using SmArch = cutlass::arch::Sm50; + + using AddOp = cuasr::maximum; + using MultOp = cuasr::plus; + + using Srgemm = cuasr::gemm::device::Srgemm< // + AddOp, MultOp, // + precision, cutlass::layout::ColumnMajor, // + precision, cutlass::layout::RowMajor, // + precision, cutlass::layout::ColumnMajor, + precision, OpClass, SmArch>; + + EXPECT_TRUE(cuasr::test::gemm::device::TestAllGemm()); +} + + +/////////////////////////////////////////////////////////////////////////////// + +TEST(SM50_device_maximum_plus_ssrgemm_nt_t, default) { + using precision = float; + using OpClass = cutlass::arch::OpClassSimt; + using SmArch = cutlass::arch::Sm50; + + using AddOp = cuasr::maximum; + using MultOp = cuasr::plus; + + using Srgemm = cuasr::gemm::device::Srgemm< // + AddOp, MultOp, // + precision, cutlass::layout::ColumnMajor, // + precision, cutlass::layout::RowMajor, // + precision, cutlass::layout::RowMajor, + precision, OpClass, SmArch>; + + EXPECT_TRUE(cuasr::test::gemm::device::TestAllGemm()); +} + + +/////////////////////////////////////////////////////////////////////////////// + +TEST(SM50_device_maximum_plus_ssrgemm_nn_n, default) { + using precision = float; + using OpClass = cutlass::arch::OpClassSimt; + using SmArch = cutlass::arch::Sm50; + + using AddOp = cuasr::maximum; + using MultOp = cuasr::plus; + + using Srgemm = cuasr::gemm::device::Srgemm< // + AddOp, MultOp, // + precision, cutlass::layout::ColumnMajor, // + precision, cutlass::layout::ColumnMajor, // + precision, cutlass::layout::ColumnMajor, + precision, OpClass, SmArch>; + + EXPECT_TRUE(cuasr::test::gemm::device::TestAllGemm()); +} + + +/////////////////////////////////////////////////////////////////////////////// + +TEST(SM50_device_maximum_plus_ssrgemm_nn_t, default) { + using precision = float; + using OpClass = cutlass::arch::OpClassSimt; + using SmArch = 
cutlass::arch::Sm50; + + using AddOp = cuasr::maximum; + using MultOp = cuasr::plus; + + using Srgemm = cuasr::gemm::device::Srgemm< // + AddOp, MultOp, // + precision, cutlass::layout::ColumnMajor, // + precision, cutlass::layout::ColumnMajor, // + precision, cutlass::layout::RowMajor, + precision, OpClass, SmArch>; + + EXPECT_TRUE(cuasr::test::gemm::device::TestAllGemm()); +} + + +/////////////////////////////////////////////////////////////////////////////// + +TEST(SM50_device_minimum_maximum_dsrgemm_tt_n, default) { + using precision = double; + using OpClass = cutlass::arch::OpClassSimt; + using SmArch = cutlass::arch::Sm50; + + using AddOp = cuasr::minimum; + using MultOp = cuasr::maximum; + + using Srgemm = cuasr::gemm::device::Srgemm< // + AddOp, MultOp, // + precision, cutlass::layout::RowMajor, // + precision, cutlass::layout::RowMajor, // + precision, cutlass::layout::ColumnMajor, + precision, OpClass, SmArch>; + + EXPECT_TRUE(cuasr::test::gemm::device::TestAllGemm()); +} + + +/////////////////////////////////////////////////////////////////////////////// + +TEST(SM50_device_minimum_maximum_dsrgemm_tt_t, default) { + using precision = double; + using OpClass = cutlass::arch::OpClassSimt; + using SmArch = cutlass::arch::Sm50; + + using AddOp = cuasr::minimum; + using MultOp = cuasr::maximum; + + using Srgemm = cuasr::gemm::device::Srgemm< // + AddOp, MultOp, // + precision, cutlass::layout::RowMajor, // + precision, cutlass::layout::RowMajor, // + precision, cutlass::layout::RowMajor, + precision, OpClass, SmArch>; + + EXPECT_TRUE(cuasr::test::gemm::device::TestAllGemm()); +} + + +/////////////////////////////////////////////////////////////////////////////// + +TEST(SM50_device_minimum_maximum_dsrgemm_tn_n, default) { + using precision = double; + using OpClass = cutlass::arch::OpClassSimt; + using SmArch = cutlass::arch::Sm50; + + using AddOp = cuasr::minimum; + using MultOp = cuasr::maximum; + + using Srgemm = cuasr::gemm::device::Srgemm< // + AddOp, 
MultOp, // + precision, cutlass::layout::RowMajor, // + precision, cutlass::layout::ColumnMajor, // + precision, cutlass::layout::ColumnMajor, + precision, OpClass, SmArch>; + + EXPECT_TRUE(cuasr::test::gemm::device::TestAllGemm()); +} + + +/////////////////////////////////////////////////////////////////////////////// + +TEST(SM50_device_minimum_maximum_dsrgemm_tn_t, default) { + using precision = double; + using OpClass = cutlass::arch::OpClassSimt; + using SmArch = cutlass::arch::Sm50; + + using AddOp = cuasr::minimum; + using MultOp = cuasr::maximum; + + using Srgemm = cuasr::gemm::device::Srgemm< // + AddOp, MultOp, // + precision, cutlass::layout::RowMajor, // + precision, cutlass::layout::ColumnMajor, // + precision, cutlass::layout::RowMajor, + precision, OpClass, SmArch>; + + EXPECT_TRUE(cuasr::test::gemm::device::TestAllGemm()); +} + + +/////////////////////////////////////////////////////////////////////////////// + +TEST(SM50_device_minimum_maximum_dsrgemm_nt_n, default) { + using precision = double; + using OpClass = cutlass::arch::OpClassSimt; + using SmArch = cutlass::arch::Sm50; + + using AddOp = cuasr::minimum; + using MultOp = cuasr::maximum; + + using Srgemm = cuasr::gemm::device::Srgemm< // + AddOp, MultOp, // + precision, cutlass::layout::ColumnMajor, // + precision, cutlass::layout::RowMajor, // + precision, cutlass::layout::ColumnMajor, + precision, OpClass, SmArch>; + + EXPECT_TRUE(cuasr::test::gemm::device::TestAllGemm()); +} + + +/////////////////////////////////////////////////////////////////////////////// + +TEST(SM50_device_minimum_maximum_dsrgemm_nt_t, default) { + using precision = double; + using OpClass = cutlass::arch::OpClassSimt; + using SmArch = cutlass::arch::Sm50; + + using AddOp = cuasr::minimum; + using MultOp = cuasr::maximum; + + using Srgemm = cuasr::gemm::device::Srgemm< // + AddOp, MultOp, // + precision, cutlass::layout::ColumnMajor, // + precision, cutlass::layout::RowMajor, // + precision, cutlass::layout::RowMajor, 
+ precision, OpClass, SmArch>; + + EXPECT_TRUE(cuasr::test::gemm::device::TestAllGemm()); +} + + +/////////////////////////////////////////////////////////////////////////////// + +TEST(SM50_device_minimum_maximum_dsrgemm_nn_n, default) { + using precision = double; + using OpClass = cutlass::arch::OpClassSimt; + using SmArch = cutlass::arch::Sm50; + + using AddOp = cuasr::minimum; + using MultOp = cuasr::maximum; + + using Srgemm = cuasr::gemm::device::Srgemm< // + AddOp, MultOp, // + precision, cutlass::layout::ColumnMajor, // + precision, cutlass::layout::ColumnMajor, // + precision, cutlass::layout::ColumnMajor, + precision, OpClass, SmArch>; + + EXPECT_TRUE(cuasr::test::gemm::device::TestAllGemm()); +} + + +/////////////////////////////////////////////////////////////////////////////// + +TEST(SM50_device_minimum_maximum_dsrgemm_nn_t, default) { + using precision = double; + using OpClass = cutlass::arch::OpClassSimt; + using SmArch = cutlass::arch::Sm50; + + using AddOp = cuasr::minimum; + using MultOp = cuasr::maximum; + + using Srgemm = cuasr::gemm::device::Srgemm< // + AddOp, MultOp, // + precision, cutlass::layout::ColumnMajor, // + precision, cutlass::layout::ColumnMajor, // + precision, cutlass::layout::RowMajor, + precision, OpClass, SmArch>; + + EXPECT_TRUE(cuasr::test::gemm::device::TestAllGemm()); +} + + +/////////////////////////////////////////////////////////////////////////////// + +TEST(SM50_device_minimum_maximum_ssrgemm_tt_n, default) { + using precision = float; + using OpClass = cutlass::arch::OpClassSimt; + using SmArch = cutlass::arch::Sm50; + + using AddOp = cuasr::minimum; + using MultOp = cuasr::maximum; + + using Srgemm = cuasr::gemm::device::Srgemm< // + AddOp, MultOp, // + precision, cutlass::layout::RowMajor, // + precision, cutlass::layout::RowMajor, // + precision, cutlass::layout::ColumnMajor, + precision, OpClass, SmArch>; + + EXPECT_TRUE(cuasr::test::gemm::device::TestAllGemm()); +} + + 
+/////////////////////////////////////////////////////////////////////////////// + +TEST(SM50_device_minimum_maximum_ssrgemm_tt_t, default) { + using precision = float; + using OpClass = cutlass::arch::OpClassSimt; + using SmArch = cutlass::arch::Sm50; + + using AddOp = cuasr::minimum; + using MultOp = cuasr::maximum; + + using Srgemm = cuasr::gemm::device::Srgemm< // + AddOp, MultOp, // + precision, cutlass::layout::RowMajor, // + precision, cutlass::layout::RowMajor, // + precision, cutlass::layout::RowMajor, + precision, OpClass, SmArch>; + + EXPECT_TRUE(cuasr::test::gemm::device::TestAllGemm()); +} + + +/////////////////////////////////////////////////////////////////////////////// + +TEST(SM50_device_minimum_maximum_ssrgemm_tn_n, default) { + using precision = float; + using OpClass = cutlass::arch::OpClassSimt; + using SmArch = cutlass::arch::Sm50; + + using AddOp = cuasr::minimum; + using MultOp = cuasr::maximum; + + using Srgemm = cuasr::gemm::device::Srgemm< // + AddOp, MultOp, // + precision, cutlass::layout::RowMajor, // + precision, cutlass::layout::ColumnMajor, // + precision, cutlass::layout::ColumnMajor, + precision, OpClass, SmArch>; + + EXPECT_TRUE(cuasr::test::gemm::device::TestAllGemm()); +} + + +/////////////////////////////////////////////////////////////////////////////// + +TEST(SM50_device_minimum_maximum_ssrgemm_tn_t, default) { + using precision = float; + using OpClass = cutlass::arch::OpClassSimt; + using SmArch = cutlass::arch::Sm50; + + using AddOp = cuasr::minimum; + using MultOp = cuasr::maximum; + + using Srgemm = cuasr::gemm::device::Srgemm< // + AddOp, MultOp, // + precision, cutlass::layout::RowMajor, // + precision, cutlass::layout::ColumnMajor, // + precision, cutlass::layout::RowMajor, + precision, OpClass, SmArch>; + + EXPECT_TRUE(cuasr::test::gemm::device::TestAllGemm()); +} + + +/////////////////////////////////////////////////////////////////////////////// + +TEST(SM50_device_minimum_maximum_ssrgemm_nt_n, default) { + 
using precision = float; + using OpClass = cutlass::arch::OpClassSimt; + using SmArch = cutlass::arch::Sm50; + + using AddOp = cuasr::minimum; + using MultOp = cuasr::maximum; + + using Srgemm = cuasr::gemm::device::Srgemm< // + AddOp, MultOp, // + precision, cutlass::layout::ColumnMajor, // + precision, cutlass::layout::RowMajor, // + precision, cutlass::layout::ColumnMajor, + precision, OpClass, SmArch>; + + EXPECT_TRUE(cuasr::test::gemm::device::TestAllGemm()); +} + + +/////////////////////////////////////////////////////////////////////////////// + +TEST(SM50_device_minimum_maximum_ssrgemm_nt_t, default) { + using precision = float; + using OpClass = cutlass::arch::OpClassSimt; + using SmArch = cutlass::arch::Sm50; + + using AddOp = cuasr::minimum; + using MultOp = cuasr::maximum; + + using Srgemm = cuasr::gemm::device::Srgemm< // + AddOp, MultOp, // + precision, cutlass::layout::ColumnMajor, // + precision, cutlass::layout::RowMajor, // + precision, cutlass::layout::RowMajor, + precision, OpClass, SmArch>; + + EXPECT_TRUE(cuasr::test::gemm::device::TestAllGemm()); +} + + +/////////////////////////////////////////////////////////////////////////////// + +TEST(SM50_device_minimum_maximum_ssrgemm_nn_n, default) { + using precision = float; + using OpClass = cutlass::arch::OpClassSimt; + using SmArch = cutlass::arch::Sm50; + + using AddOp = cuasr::minimum; + using MultOp = cuasr::maximum; + + using Srgemm = cuasr::gemm::device::Srgemm< // + AddOp, MultOp, // + precision, cutlass::layout::ColumnMajor, // + precision, cutlass::layout::ColumnMajor, // + precision, cutlass::layout::ColumnMajor, + precision, OpClass, SmArch>; + + EXPECT_TRUE(cuasr::test::gemm::device::TestAllGemm()); +} + + +/////////////////////////////////////////////////////////////////////////////// + +TEST(SM50_device_minimum_maximum_ssrgemm_nn_t, default) { + using precision = float; + using OpClass = cutlass::arch::OpClassSimt; + using SmArch = cutlass::arch::Sm50; + + using AddOp = 
cuasr::minimum; + using MultOp = cuasr::maximum; + + using Srgemm = cuasr::gemm::device::Srgemm< // + AddOp, MultOp, // + precision, cutlass::layout::ColumnMajor, // + precision, cutlass::layout::ColumnMajor, // + precision, cutlass::layout::RowMajor, + precision, OpClass, SmArch>; + + EXPECT_TRUE(cuasr::test::gemm::device::TestAllGemm()); +} + + +/////////////////////////////////////////////////////////////////////////////// + +TEST(SM50_device_maximum_minimum_dsrgemm_tt_n, default) { + using precision = double; + using OpClass = cutlass::arch::OpClassSimt; + using SmArch = cutlass::arch::Sm50; + + using AddOp = cuasr::maximum; + using MultOp = cuasr::minimum; + + using Srgemm = cuasr::gemm::device::Srgemm< // + AddOp, MultOp, // + precision, cutlass::layout::RowMajor, // + precision, cutlass::layout::RowMajor, // + precision, cutlass::layout::ColumnMajor, + precision, OpClass, SmArch>; + + EXPECT_TRUE(cuasr::test::gemm::device::TestAllGemm()); +} + + +/////////////////////////////////////////////////////////////////////////////// + +TEST(SM50_device_maximum_minimum_dsrgemm_tt_t, default) { + using precision = double; + using OpClass = cutlass::arch::OpClassSimt; + using SmArch = cutlass::arch::Sm50; + + using AddOp = cuasr::maximum; + using MultOp = cuasr::minimum; + + using Srgemm = cuasr::gemm::device::Srgemm< // + AddOp, MultOp, // + precision, cutlass::layout::RowMajor, // + precision, cutlass::layout::RowMajor, // + precision, cutlass::layout::RowMajor, + precision, OpClass, SmArch>; + + EXPECT_TRUE(cuasr::test::gemm::device::TestAllGemm()); +} + + +/////////////////////////////////////////////////////////////////////////////// + +TEST(SM50_device_maximum_minimum_dsrgemm_tn_n, default) { + using precision = double; + using OpClass = cutlass::arch::OpClassSimt; + using SmArch = cutlass::arch::Sm50; + + using AddOp = cuasr::maximum; + using MultOp = cuasr::minimum; + + using Srgemm = cuasr::gemm::device::Srgemm< // + AddOp, MultOp, // + precision, 
cutlass::layout::RowMajor, // + precision, cutlass::layout::ColumnMajor, // + precision, cutlass::layout::ColumnMajor, + precision, OpClass, SmArch>; + + EXPECT_TRUE(cuasr::test::gemm::device::TestAllGemm()); +} + + +/////////////////////////////////////////////////////////////////////////////// + +TEST(SM50_device_maximum_minimum_dsrgemm_tn_t, default) { + using precision = double; + using OpClass = cutlass::arch::OpClassSimt; + using SmArch = cutlass::arch::Sm50; + + using AddOp = cuasr::maximum; + using MultOp = cuasr::minimum; + + using Srgemm = cuasr::gemm::device::Srgemm< // + AddOp, MultOp, // + precision, cutlass::layout::RowMajor, // + precision, cutlass::layout::ColumnMajor, // + precision, cutlass::layout::RowMajor, + precision, OpClass, SmArch>; + + EXPECT_TRUE(cuasr::test::gemm::device::TestAllGemm()); +} + + +/////////////////////////////////////////////////////////////////////////////// + +TEST(SM50_device_maximum_minimum_dsrgemm_nt_n, default) { + using precision = double; + using OpClass = cutlass::arch::OpClassSimt; + using SmArch = cutlass::arch::Sm50; + + using AddOp = cuasr::maximum; + using MultOp = cuasr::minimum; + + using Srgemm = cuasr::gemm::device::Srgemm< // + AddOp, MultOp, // + precision, cutlass::layout::ColumnMajor, // + precision, cutlass::layout::RowMajor, // + precision, cutlass::layout::ColumnMajor, + precision, OpClass, SmArch>; + + EXPECT_TRUE(cuasr::test::gemm::device::TestAllGemm()); +} + + +/////////////////////////////////////////////////////////////////////////////// + +TEST(SM50_device_maximum_minimum_dsrgemm_nt_t, default) { + using precision = double; + using OpClass = cutlass::arch::OpClassSimt; + using SmArch = cutlass::arch::Sm50; + + using AddOp = cuasr::maximum; + using MultOp = cuasr::minimum; + + using Srgemm = cuasr::gemm::device::Srgemm< // + AddOp, MultOp, // + precision, cutlass::layout::ColumnMajor, // + precision, cutlass::layout::RowMajor, // + precision, cutlass::layout::RowMajor, + precision, OpClass, 
SmArch>; + + EXPECT_TRUE(cuasr::test::gemm::device::TestAllGemm()); +} + + +/////////////////////////////////////////////////////////////////////////////// + +TEST(SM50_device_maximum_minimum_dsrgemm_nn_n, default) { + using precision = double; + using OpClass = cutlass::arch::OpClassSimt; + using SmArch = cutlass::arch::Sm50; + + using AddOp = cuasr::maximum; + using MultOp = cuasr::minimum; + + using Srgemm = cuasr::gemm::device::Srgemm< // + AddOp, MultOp, // + precision, cutlass::layout::ColumnMajor, // + precision, cutlass::layout::ColumnMajor, // + precision, cutlass::layout::ColumnMajor, + precision, OpClass, SmArch>; + + EXPECT_TRUE(cuasr::test::gemm::device::TestAllGemm()); +} + + +/////////////////////////////////////////////////////////////////////////////// + +TEST(SM50_device_maximum_minimum_dsrgemm_nn_t, default) { + using precision = double; + using OpClass = cutlass::arch::OpClassSimt; + using SmArch = cutlass::arch::Sm50; + + using AddOp = cuasr::maximum; + using MultOp = cuasr::minimum; + + using Srgemm = cuasr::gemm::device::Srgemm< // + AddOp, MultOp, // + precision, cutlass::layout::ColumnMajor, // + precision, cutlass::layout::ColumnMajor, // + precision, cutlass::layout::RowMajor, + precision, OpClass, SmArch>; + + EXPECT_TRUE(cuasr::test::gemm::device::TestAllGemm()); +} + + +/////////////////////////////////////////////////////////////////////////////// + +TEST(SM50_device_maximum_minimum_ssrgemm_tt_n, default) { + using precision = float; + using OpClass = cutlass::arch::OpClassSimt; + using SmArch = cutlass::arch::Sm50; + + using AddOp = cuasr::maximum; + using MultOp = cuasr::minimum; + + using Srgemm = cuasr::gemm::device::Srgemm< // + AddOp, MultOp, // + precision, cutlass::layout::RowMajor, // + precision, cutlass::layout::RowMajor, // + precision, cutlass::layout::ColumnMajor, + precision, OpClass, SmArch>; + + EXPECT_TRUE(cuasr::test::gemm::device::TestAllGemm()); +} + + 
+/////////////////////////////////////////////////////////////////////////////// + +TEST(SM50_device_maximum_minimum_ssrgemm_tt_t, default) { + using precision = float; + using OpClass = cutlass::arch::OpClassSimt; + using SmArch = cutlass::arch::Sm50; + + using AddOp = cuasr::maximum; + using MultOp = cuasr::minimum; + + using Srgemm = cuasr::gemm::device::Srgemm< // + AddOp, MultOp, // + precision, cutlass::layout::RowMajor, // + precision, cutlass::layout::RowMajor, // + precision, cutlass::layout::RowMajor, + precision, OpClass, SmArch>; + + EXPECT_TRUE(cuasr::test::gemm::device::TestAllGemm()); +} + + +/////////////////////////////////////////////////////////////////////////////// + +TEST(SM50_device_maximum_minimum_ssrgemm_tn_n, default) { + using precision = float; + using OpClass = cutlass::arch::OpClassSimt; + using SmArch = cutlass::arch::Sm50; + + using AddOp = cuasr::maximum; + using MultOp = cuasr::minimum; + + using Srgemm = cuasr::gemm::device::Srgemm< // + AddOp, MultOp, // + precision, cutlass::layout::RowMajor, // + precision, cutlass::layout::ColumnMajor, // + precision, cutlass::layout::ColumnMajor, + precision, OpClass, SmArch>; + + EXPECT_TRUE(cuasr::test::gemm::device::TestAllGemm()); +} + + +/////////////////////////////////////////////////////////////////////////////// + +TEST(SM50_device_maximum_minimum_ssrgemm_tn_t, default) { + using precision = float; + using OpClass = cutlass::arch::OpClassSimt; + using SmArch = cutlass::arch::Sm50; + + using AddOp = cuasr::maximum; + using MultOp = cuasr::minimum; + + using Srgemm = cuasr::gemm::device::Srgemm< // + AddOp, MultOp, // + precision, cutlass::layout::RowMajor, // + precision, cutlass::layout::ColumnMajor, // + precision, cutlass::layout::RowMajor, + precision, OpClass, SmArch>; + + EXPECT_TRUE(cuasr::test::gemm::device::TestAllGemm()); +} + + +/////////////////////////////////////////////////////////////////////////////// + +TEST(SM50_device_maximum_minimum_ssrgemm_nt_n, default) { + 
using precision = float; + using OpClass = cutlass::arch::OpClassSimt; + using SmArch = cutlass::arch::Sm50; + + using AddOp = cuasr::maximum; + using MultOp = cuasr::minimum; + + using Srgemm = cuasr::gemm::device::Srgemm< // + AddOp, MultOp, // + precision, cutlass::layout::ColumnMajor, // + precision, cutlass::layout::RowMajor, // + precision, cutlass::layout::ColumnMajor, + precision, OpClass, SmArch>; + + EXPECT_TRUE(cuasr::test::gemm::device::TestAllGemm()); +} + + +/////////////////////////////////////////////////////////////////////////////// + +TEST(SM50_device_maximum_minimum_ssrgemm_nt_t, default) { + using precision = float; + using OpClass = cutlass::arch::OpClassSimt; + using SmArch = cutlass::arch::Sm50; + + using AddOp = cuasr::maximum; + using MultOp = cuasr::minimum; + + using Srgemm = cuasr::gemm::device::Srgemm< // + AddOp, MultOp, // + precision, cutlass::layout::ColumnMajor, // + precision, cutlass::layout::RowMajor, // + precision, cutlass::layout::RowMajor, + precision, OpClass, SmArch>; + + EXPECT_TRUE(cuasr::test::gemm::device::TestAllGemm()); +} + + +/////////////////////////////////////////////////////////////////////////////// + +TEST(SM50_device_maximum_minimum_ssrgemm_nn_n, default) { + using precision = float; + using OpClass = cutlass::arch::OpClassSimt; + using SmArch = cutlass::arch::Sm50; + + using AddOp = cuasr::maximum; + using MultOp = cuasr::minimum; + + using Srgemm = cuasr::gemm::device::Srgemm< // + AddOp, MultOp, // + precision, cutlass::layout::ColumnMajor, // + precision, cutlass::layout::ColumnMajor, // + precision, cutlass::layout::ColumnMajor, + precision, OpClass, SmArch>; + + EXPECT_TRUE(cuasr::test::gemm::device::TestAllGemm()); +} + + +/////////////////////////////////////////////////////////////////////////////// + +TEST(SM50_device_maximum_minimum_ssrgemm_nn_t, default) { + using precision = float; + using OpClass = cutlass::arch::OpClassSimt; + using SmArch = cutlass::arch::Sm50; + + using AddOp = 
cuasr::maximum; + using MultOp = cuasr::minimum; + + using Srgemm = cuasr::gemm::device::Srgemm< // + AddOp, MultOp, // + precision, cutlass::layout::ColumnMajor, // + precision, cutlass::layout::ColumnMajor, // + precision, cutlass::layout::RowMajor, + precision, OpClass, SmArch>; + + EXPECT_TRUE(cuasr::test::gemm::device::TestAllGemm()); +} + + +/////////////////////////////////////////////////////////////////////////////// + +TEST(SM50_device_minimum_multiplies_dsrgemm_tt_n, default) { + using precision = double; + using OpClass = cutlass::arch::OpClassSimt; + using SmArch = cutlass::arch::Sm50; + + using AddOp = cuasr::minimum; + using MultOp = cuasr::multiplies; + + using Srgemm = cuasr::gemm::device::Srgemm< // + AddOp, MultOp, // + precision, cutlass::layout::RowMajor, // + precision, cutlass::layout::RowMajor, // + precision, cutlass::layout::ColumnMajor, + precision, OpClass, SmArch>; + + EXPECT_TRUE(cuasr::test::gemm::device::TestAllGemm()); +} + + +/////////////////////////////////////////////////////////////////////////////// + +TEST(SM50_device_minimum_multiplies_dsrgemm_tt_t, default) { + using precision = double; + using OpClass = cutlass::arch::OpClassSimt; + using SmArch = cutlass::arch::Sm50; + + using AddOp = cuasr::minimum; + using MultOp = cuasr::multiplies; + + using Srgemm = cuasr::gemm::device::Srgemm< // + AddOp, MultOp, // + precision, cutlass::layout::RowMajor, // + precision, cutlass::layout::RowMajor, // + precision, cutlass::layout::RowMajor, + precision, OpClass, SmArch>; + + EXPECT_TRUE(cuasr::test::gemm::device::TestAllGemm()); +} + + +/////////////////////////////////////////////////////////////////////////////// + +TEST(SM50_device_minimum_multiplies_dsrgemm_tn_n, default) { + using precision = double; + using OpClass = cutlass::arch::OpClassSimt; + using SmArch = cutlass::arch::Sm50; + + using AddOp = cuasr::minimum; + using MultOp = cuasr::multiplies; + + using Srgemm = cuasr::gemm::device::Srgemm< // + AddOp, MultOp, // + 
precision, cutlass::layout::RowMajor, // + precision, cutlass::layout::ColumnMajor, // + precision, cutlass::layout::ColumnMajor, + precision, OpClass, SmArch>; + + EXPECT_TRUE(cuasr::test::gemm::device::TestAllGemm()); +} + + +/////////////////////////////////////////////////////////////////////////////// + +TEST(SM50_device_minimum_multiplies_dsrgemm_tn_t, default) { + using precision = double; + using OpClass = cutlass::arch::OpClassSimt; + using SmArch = cutlass::arch::Sm50; + + using AddOp = cuasr::minimum; + using MultOp = cuasr::multiplies; + + using Srgemm = cuasr::gemm::device::Srgemm< // + AddOp, MultOp, // + precision, cutlass::layout::RowMajor, // + precision, cutlass::layout::ColumnMajor, // + precision, cutlass::layout::RowMajor, + precision, OpClass, SmArch>; + + EXPECT_TRUE(cuasr::test::gemm::device::TestAllGemm()); +} + + +/////////////////////////////////////////////////////////////////////////////// + +TEST(SM50_device_minimum_multiplies_dsrgemm_nt_n, default) { + using precision = double; + using OpClass = cutlass::arch::OpClassSimt; + using SmArch = cutlass::arch::Sm50; + + using AddOp = cuasr::minimum; + using MultOp = cuasr::multiplies; + + using Srgemm = cuasr::gemm::device::Srgemm< // + AddOp, MultOp, // + precision, cutlass::layout::ColumnMajor, // + precision, cutlass::layout::RowMajor, // + precision, cutlass::layout::ColumnMajor, + precision, OpClass, SmArch>; + + EXPECT_TRUE(cuasr::test::gemm::device::TestAllGemm()); +} + + +/////////////////////////////////////////////////////////////////////////////// + +TEST(SM50_device_minimum_multiplies_dsrgemm_nt_t, default) { + using precision = double; + using OpClass = cutlass::arch::OpClassSimt; + using SmArch = cutlass::arch::Sm50; + + using AddOp = cuasr::minimum; + using MultOp = cuasr::multiplies; + + using Srgemm = cuasr::gemm::device::Srgemm< // + AddOp, MultOp, // + precision, cutlass::layout::ColumnMajor, // + precision, cutlass::layout::RowMajor, // + precision, 
cutlass::layout::RowMajor, + precision, OpClass, SmArch>; + + EXPECT_TRUE(cuasr::test::gemm::device::TestAllGemm()); +} + + +/////////////////////////////////////////////////////////////////////////////// + +TEST(SM50_device_minimum_multiplies_dsrgemm_nn_n, default) { + using precision = double; + using OpClass = cutlass::arch::OpClassSimt; + using SmArch = cutlass::arch::Sm50; + + using AddOp = cuasr::minimum; + using MultOp = cuasr::multiplies; + + using Srgemm = cuasr::gemm::device::Srgemm< // + AddOp, MultOp, // + precision, cutlass::layout::ColumnMajor, // + precision, cutlass::layout::ColumnMajor, // + precision, cutlass::layout::ColumnMajor, + precision, OpClass, SmArch>; + + EXPECT_TRUE(cuasr::test::gemm::device::TestAllGemm()); +} + + +/////////////////////////////////////////////////////////////////////////////// + +TEST(SM50_device_minimum_multiplies_dsrgemm_nn_t, default) { + using precision = double; + using OpClass = cutlass::arch::OpClassSimt; + using SmArch = cutlass::arch::Sm50; + + using AddOp = cuasr::minimum; + using MultOp = cuasr::multiplies; + + using Srgemm = cuasr::gemm::device::Srgemm< // + AddOp, MultOp, // + precision, cutlass::layout::ColumnMajor, // + precision, cutlass::layout::ColumnMajor, // + precision, cutlass::layout::RowMajor, + precision, OpClass, SmArch>; + + EXPECT_TRUE(cuasr::test::gemm::device::TestAllGemm()); +} + + +/////////////////////////////////////////////////////////////////////////////// + +TEST(SM50_device_minimum_multiplies_ssrgemm_tt_n, default) { + using precision = float; + using OpClass = cutlass::arch::OpClassSimt; + using SmArch = cutlass::arch::Sm50; + + using AddOp = cuasr::minimum; + using MultOp = cuasr::multiplies; + + using Srgemm = cuasr::gemm::device::Srgemm< // + AddOp, MultOp, // + precision, cutlass::layout::RowMajor, // + precision, cutlass::layout::RowMajor, // + precision, cutlass::layout::ColumnMajor, + precision, OpClass, SmArch>; + + EXPECT_TRUE(cuasr::test::gemm::device::TestAllGemm()); +} 
+ + +/////////////////////////////////////////////////////////////////////////////// + +TEST(SM50_device_minimum_multiplies_ssrgemm_tt_t, default) { + using precision = float; + using OpClass = cutlass::arch::OpClassSimt; + using SmArch = cutlass::arch::Sm50; + + using AddOp = cuasr::minimum; + using MultOp = cuasr::multiplies; + + using Srgemm = cuasr::gemm::device::Srgemm< // + AddOp, MultOp, // + precision, cutlass::layout::RowMajor, // + precision, cutlass::layout::RowMajor, // + precision, cutlass::layout::RowMajor, + precision, OpClass, SmArch>; + + EXPECT_TRUE(cuasr::test::gemm::device::TestAllGemm()); +} + + +/////////////////////////////////////////////////////////////////////////////// + +TEST(SM50_device_minimum_multiplies_ssrgemm_tn_n, default) { + using precision = float; + using OpClass = cutlass::arch::OpClassSimt; + using SmArch = cutlass::arch::Sm50; + + using AddOp = cuasr::minimum; + using MultOp = cuasr::multiplies; + + using Srgemm = cuasr::gemm::device::Srgemm< // + AddOp, MultOp, // + precision, cutlass::layout::RowMajor, // + precision, cutlass::layout::ColumnMajor, // + precision, cutlass::layout::ColumnMajor, + precision, OpClass, SmArch>; + + EXPECT_TRUE(cuasr::test::gemm::device::TestAllGemm()); +} + + +/////////////////////////////////////////////////////////////////////////////// + +TEST(SM50_device_minimum_multiplies_ssrgemm_tn_t, default) { + using precision = float; + using OpClass = cutlass::arch::OpClassSimt; + using SmArch = cutlass::arch::Sm50; + + using AddOp = cuasr::minimum; + using MultOp = cuasr::multiplies; + + using Srgemm = cuasr::gemm::device::Srgemm< // + AddOp, MultOp, // + precision, cutlass::layout::RowMajor, // + precision, cutlass::layout::ColumnMajor, // + precision, cutlass::layout::RowMajor, + precision, OpClass, SmArch>; + + EXPECT_TRUE(cuasr::test::gemm::device::TestAllGemm()); +} + + +/////////////////////////////////////////////////////////////////////////////// + 
+TEST(SM50_device_minimum_multiplies_ssrgemm_nt_n, default) { + using precision = float; + using OpClass = cutlass::arch::OpClassSimt; + using SmArch = cutlass::arch::Sm50; + + using AddOp = cuasr::minimum; + using MultOp = cuasr::multiplies; + + using Srgemm = cuasr::gemm::device::Srgemm< // + AddOp, MultOp, // + precision, cutlass::layout::ColumnMajor, // + precision, cutlass::layout::RowMajor, // + precision, cutlass::layout::ColumnMajor, + precision, OpClass, SmArch>; + + EXPECT_TRUE(cuasr::test::gemm::device::TestAllGemm()); +} + + +/////////////////////////////////////////////////////////////////////////////// + +TEST(SM50_device_minimum_multiplies_ssrgemm_nt_t, default) { + using precision = float; + using OpClass = cutlass::arch::OpClassSimt; + using SmArch = cutlass::arch::Sm50; + + using AddOp = cuasr::minimum; + using MultOp = cuasr::multiplies; + + using Srgemm = cuasr::gemm::device::Srgemm< // + AddOp, MultOp, // + precision, cutlass::layout::ColumnMajor, // + precision, cutlass::layout::RowMajor, // + precision, cutlass::layout::RowMajor, + precision, OpClass, SmArch>; + + EXPECT_TRUE(cuasr::test::gemm::device::TestAllGemm()); +} + + +/////////////////////////////////////////////////////////////////////////////// + +TEST(SM50_device_minimum_multiplies_ssrgemm_nn_n, default) { + using precision = float; + using OpClass = cutlass::arch::OpClassSimt; + using SmArch = cutlass::arch::Sm50; + + using AddOp = cuasr::minimum; + using MultOp = cuasr::multiplies; + + using Srgemm = cuasr::gemm::device::Srgemm< // + AddOp, MultOp, // + precision, cutlass::layout::ColumnMajor, // + precision, cutlass::layout::ColumnMajor, // + precision, cutlass::layout::ColumnMajor, + precision, OpClass, SmArch>; + + EXPECT_TRUE(cuasr::test::gemm::device::TestAllGemm()); +} + + +/////////////////////////////////////////////////////////////////////////////// + +TEST(SM50_device_minimum_multiplies_ssrgemm_nn_t, default) { + using precision = float; + using OpClass = 
cutlass::arch::OpClassSimt; + using SmArch = cutlass::arch::Sm50; + + using AddOp = cuasr::minimum; + using MultOp = cuasr::multiplies; + + using Srgemm = cuasr::gemm::device::Srgemm< // + AddOp, MultOp, // + precision, cutlass::layout::ColumnMajor, // + precision, cutlass::layout::ColumnMajor, // + precision, cutlass::layout::RowMajor, + precision, OpClass, SmArch>; + + EXPECT_TRUE(cuasr::test::gemm::device::TestAllGemm()); +} + + +/////////////////////////////////////////////////////////////////////////////// + +TEST(SM50_device_maximum_multiplies_dsrgemm_tt_n, default) { + using precision = double; + using OpClass = cutlass::arch::OpClassSimt; + using SmArch = cutlass::arch::Sm50; + + using AddOp = cuasr::maximum; + using MultOp = cuasr::multiplies; + + using Srgemm = cuasr::gemm::device::Srgemm< // + AddOp, MultOp, // + precision, cutlass::layout::RowMajor, // + precision, cutlass::layout::RowMajor, // + precision, cutlass::layout::ColumnMajor, + precision, OpClass, SmArch>; + + EXPECT_TRUE(cuasr::test::gemm::device::TestAllGemm()); +} + + +/////////////////////////////////////////////////////////////////////////////// + +TEST(SM50_device_maximum_multiplies_dsrgemm_tt_t, default) { + using precision = double; + using OpClass = cutlass::arch::OpClassSimt; + using SmArch = cutlass::arch::Sm50; + + using AddOp = cuasr::maximum; + using MultOp = cuasr::multiplies; + + using Srgemm = cuasr::gemm::device::Srgemm< // + AddOp, MultOp, // + precision, cutlass::layout::RowMajor, // + precision, cutlass::layout::RowMajor, // + precision, cutlass::layout::RowMajor, + precision, OpClass, SmArch>; + + EXPECT_TRUE(cuasr::test::gemm::device::TestAllGemm()); +} + + +/////////////////////////////////////////////////////////////////////////////// + +TEST(SM50_device_maximum_multiplies_dsrgemm_tn_n, default) { + using precision = double; + using OpClass = cutlass::arch::OpClassSimt; + using SmArch = cutlass::arch::Sm50; + + using AddOp = cuasr::maximum; + using MultOp = 
cuasr::multiplies; + + using Srgemm = cuasr::gemm::device::Srgemm< // + AddOp, MultOp, // + precision, cutlass::layout::RowMajor, // + precision, cutlass::layout::ColumnMajor, // + precision, cutlass::layout::ColumnMajor, + precision, OpClass, SmArch>; + + EXPECT_TRUE(cuasr::test::gemm::device::TestAllGemm()); +} + + +/////////////////////////////////////////////////////////////////////////////// + +TEST(SM50_device_maximum_multiplies_dsrgemm_tn_t, default) { + using precision = double; + using OpClass = cutlass::arch::OpClassSimt; + using SmArch = cutlass::arch::Sm50; + + using AddOp = cuasr::maximum; + using MultOp = cuasr::multiplies; + + using Srgemm = cuasr::gemm::device::Srgemm< // + AddOp, MultOp, // + precision, cutlass::layout::RowMajor, // + precision, cutlass::layout::ColumnMajor, // + precision, cutlass::layout::RowMajor, + precision, OpClass, SmArch>; + + EXPECT_TRUE(cuasr::test::gemm::device::TestAllGemm()); +} + + +/////////////////////////////////////////////////////////////////////////////// + +TEST(SM50_device_maximum_multiplies_dsrgemm_nt_n, default) { + using precision = double; + using OpClass = cutlass::arch::OpClassSimt; + using SmArch = cutlass::arch::Sm50; + + using AddOp = cuasr::maximum; + using MultOp = cuasr::multiplies; + + using Srgemm = cuasr::gemm::device::Srgemm< // + AddOp, MultOp, // + precision, cutlass::layout::ColumnMajor, // + precision, cutlass::layout::RowMajor, // + precision, cutlass::layout::ColumnMajor, + precision, OpClass, SmArch>; + + EXPECT_TRUE(cuasr::test::gemm::device::TestAllGemm()); +} + + +/////////////////////////////////////////////////////////////////////////////// + +TEST(SM50_device_maximum_multiplies_dsrgemm_nt_t, default) { + using precision = double; + using OpClass = cutlass::arch::OpClassSimt; + using SmArch = cutlass::arch::Sm50; + + using AddOp = cuasr::maximum; + using MultOp = cuasr::multiplies; + + using Srgemm = cuasr::gemm::device::Srgemm< // + AddOp, MultOp, // + precision, 
cutlass::layout::ColumnMajor, // + precision, cutlass::layout::RowMajor, // + precision, cutlass::layout::RowMajor, + precision, OpClass, SmArch>; + + EXPECT_TRUE(cuasr::test::gemm::device::TestAllGemm()); +} + + +/////////////////////////////////////////////////////////////////////////////// + +TEST(SM50_device_maximum_multiplies_dsrgemm_nn_n, default) { + using precision = double; + using OpClass = cutlass::arch::OpClassSimt; + using SmArch = cutlass::arch::Sm50; + + using AddOp = cuasr::maximum; + using MultOp = cuasr::multiplies; + + using Srgemm = cuasr::gemm::device::Srgemm< // + AddOp, MultOp, // + precision, cutlass::layout::ColumnMajor, // + precision, cutlass::layout::ColumnMajor, // + precision, cutlass::layout::ColumnMajor, + precision, OpClass, SmArch>; + + EXPECT_TRUE(cuasr::test::gemm::device::TestAllGemm()); +} + + +/////////////////////////////////////////////////////////////////////////////// + +TEST(SM50_device_maximum_multiplies_dsrgemm_nn_t, default) { + using precision = double; + using OpClass = cutlass::arch::OpClassSimt; + using SmArch = cutlass::arch::Sm50; + + using AddOp = cuasr::maximum; + using MultOp = cuasr::multiplies; + + using Srgemm = cuasr::gemm::device::Srgemm< // + AddOp, MultOp, // + precision, cutlass::layout::ColumnMajor, // + precision, cutlass::layout::ColumnMajor, // + precision, cutlass::layout::RowMajor, + precision, OpClass, SmArch>; + + EXPECT_TRUE(cuasr::test::gemm::device::TestAllGemm()); +} + + +/////////////////////////////////////////////////////////////////////////////// + +TEST(SM50_device_maximum_multiplies_ssrgemm_tt_n, default) { + using precision = float; + using OpClass = cutlass::arch::OpClassSimt; + using SmArch = cutlass::arch::Sm50; + + using AddOp = cuasr::maximum; + using MultOp = cuasr::multiplies; + + using Srgemm = cuasr::gemm::device::Srgemm< // + AddOp, MultOp, // + precision, cutlass::layout::RowMajor, // + precision, cutlass::layout::RowMajor, // + precision, cutlass::layout::ColumnMajor, + 
precision, OpClass, SmArch>; + + EXPECT_TRUE(cuasr::test::gemm::device::TestAllGemm()); +} + + +/////////////////////////////////////////////////////////////////////////////// + +TEST(SM50_device_maximum_multiplies_ssrgemm_tt_t, default) { + using precision = float; + using OpClass = cutlass::arch::OpClassSimt; + using SmArch = cutlass::arch::Sm50; + + using AddOp = cuasr::maximum; + using MultOp = cuasr::multiplies; + + using Srgemm = cuasr::gemm::device::Srgemm< // + AddOp, MultOp, // + precision, cutlass::layout::RowMajor, // + precision, cutlass::layout::RowMajor, // + precision, cutlass::layout::RowMajor, + precision, OpClass, SmArch>; + + EXPECT_TRUE(cuasr::test::gemm::device::TestAllGemm()); +} + + +/////////////////////////////////////////////////////////////////////////////// + +TEST(SM50_device_maximum_multiplies_ssrgemm_tn_n, default) { + using precision = float; + using OpClass = cutlass::arch::OpClassSimt; + using SmArch = cutlass::arch::Sm50; + + using AddOp = cuasr::maximum; + using MultOp = cuasr::multiplies; + + using Srgemm = cuasr::gemm::device::Srgemm< // + AddOp, MultOp, // + precision, cutlass::layout::RowMajor, // + precision, cutlass::layout::ColumnMajor, // + precision, cutlass::layout::ColumnMajor, + precision, OpClass, SmArch>; + + EXPECT_TRUE(cuasr::test::gemm::device::TestAllGemm()); +} + + +/////////////////////////////////////////////////////////////////////////////// + +TEST(SM50_device_maximum_multiplies_ssrgemm_tn_t, default) { + using precision = float; + using OpClass = cutlass::arch::OpClassSimt; + using SmArch = cutlass::arch::Sm50; + + using AddOp = cuasr::maximum; + using MultOp = cuasr::multiplies; + + using Srgemm = cuasr::gemm::device::Srgemm< // + AddOp, MultOp, // + precision, cutlass::layout::RowMajor, // + precision, cutlass::layout::ColumnMajor, // + precision, cutlass::layout::RowMajor, + precision, OpClass, SmArch>; + + EXPECT_TRUE(cuasr::test::gemm::device::TestAllGemm()); +} + + 
+/////////////////////////////////////////////////////////////////////////////// + +TEST(SM50_device_maximum_multiplies_ssrgemm_nt_n, default) { + using precision = float; + using OpClass = cutlass::arch::OpClassSimt; + using SmArch = cutlass::arch::Sm50; + + using AddOp = cuasr::maximum; + using MultOp = cuasr::multiplies; + + using Srgemm = cuasr::gemm::device::Srgemm< // + AddOp, MultOp, // + precision, cutlass::layout::ColumnMajor, // + precision, cutlass::layout::RowMajor, // + precision, cutlass::layout::ColumnMajor, + precision, OpClass, SmArch>; + + EXPECT_TRUE(cuasr::test::gemm::device::TestAllGemm()); +} + + +/////////////////////////////////////////////////////////////////////////////// + +TEST(SM50_device_maximum_multiplies_ssrgemm_nt_t, default) { + using precision = float; + using OpClass = cutlass::arch::OpClassSimt; + using SmArch = cutlass::arch::Sm50; + + using AddOp = cuasr::maximum; + using MultOp = cuasr::multiplies; + + using Srgemm = cuasr::gemm::device::Srgemm< // + AddOp, MultOp, // + precision, cutlass::layout::ColumnMajor, // + precision, cutlass::layout::RowMajor, // + precision, cutlass::layout::RowMajor, + precision, OpClass, SmArch>; + + EXPECT_TRUE(cuasr::test::gemm::device::TestAllGemm()); +} + + +/////////////////////////////////////////////////////////////////////////////// + +TEST(SM50_device_maximum_multiplies_ssrgemm_nn_n, default) { + using precision = float; + using OpClass = cutlass::arch::OpClassSimt; + using SmArch = cutlass::arch::Sm50; + + using AddOp = cuasr::maximum; + using MultOp = cuasr::multiplies; + + using Srgemm = cuasr::gemm::device::Srgemm< // + AddOp, MultOp, // + precision, cutlass::layout::ColumnMajor, // + precision, cutlass::layout::ColumnMajor, // + precision, cutlass::layout::ColumnMajor, + precision, OpClass, SmArch>; + + EXPECT_TRUE(cuasr::test::gemm::device::TestAllGemm()); +} + + +/////////////////////////////////////////////////////////////////////////////// + 
+TEST(SM50_device_maximum_multiplies_ssrgemm_nn_t, default) { + using precision = float; + using OpClass = cutlass::arch::OpClassSimt; + using SmArch = cutlass::arch::Sm50; + + using AddOp = cuasr::maximum; + using MultOp = cuasr::multiplies; + + using Srgemm = cuasr::gemm::device::Srgemm< // + AddOp, MultOp, // + precision, cutlass::layout::ColumnMajor, // + precision, cutlass::layout::ColumnMajor, // + precision, cutlass::layout::RowMajor, + precision, OpClass, SmArch>; + + EXPECT_TRUE(cuasr::test::gemm::device::TestAllGemm()); +} + + +/////////////////////////////////////////////////////////////////////////////// + +TEST(SM50_device_binary_or_binary_and_dsrgemm_tt_n, default) { + using precision = double; + using OpClass = cutlass::arch::OpClassSimt; + using SmArch = cutlass::arch::Sm50; + + using AddOp = cuasr::binary_or; + using MultOp = cuasr::binary_and; + + using Srgemm = cuasr::gemm::device::Srgemm< // + AddOp, MultOp, // + precision, cutlass::layout::RowMajor, // + precision, cutlass::layout::RowMajor, // + precision, cutlass::layout::ColumnMajor, + precision, OpClass, SmArch>; + + EXPECT_TRUE(cuasr::test::gemm::device::TestAllGemm()); +} + + +/////////////////////////////////////////////////////////////////////////////// + +TEST(SM50_device_binary_or_binary_and_dsrgemm_tt_t, default) { + using precision = double; + using OpClass = cutlass::arch::OpClassSimt; + using SmArch = cutlass::arch::Sm50; + + using AddOp = cuasr::binary_or; + using MultOp = cuasr::binary_and; + + using Srgemm = cuasr::gemm::device::Srgemm< // + AddOp, MultOp, // + precision, cutlass::layout::RowMajor, // + precision, cutlass::layout::RowMajor, // + precision, cutlass::layout::RowMajor, + precision, OpClass, SmArch>; + + EXPECT_TRUE(cuasr::test::gemm::device::TestAllGemm()); +} + + +/////////////////////////////////////////////////////////////////////////////// + +TEST(SM50_device_binary_or_binary_and_dsrgemm_tn_n, default) { + using precision = double; + using OpClass = 
cutlass::arch::OpClassSimt; + using SmArch = cutlass::arch::Sm50; + + using AddOp = cuasr::binary_or; + using MultOp = cuasr::binary_and; + + using Srgemm = cuasr::gemm::device::Srgemm< // + AddOp, MultOp, // + precision, cutlass::layout::RowMajor, // + precision, cutlass::layout::ColumnMajor, // + precision, cutlass::layout::ColumnMajor, + precision, OpClass, SmArch>; + + EXPECT_TRUE(cuasr::test::gemm::device::TestAllGemm()); +} + + +/////////////////////////////////////////////////////////////////////////////// + +TEST(SM50_device_binary_or_binary_and_dsrgemm_tn_t, default) { + using precision = double; + using OpClass = cutlass::arch::OpClassSimt; + using SmArch = cutlass::arch::Sm50; + + using AddOp = cuasr::binary_or; + using MultOp = cuasr::binary_and; + + using Srgemm = cuasr::gemm::device::Srgemm< // + AddOp, MultOp, // + precision, cutlass::layout::RowMajor, // + precision, cutlass::layout::ColumnMajor, // + precision, cutlass::layout::RowMajor, + precision, OpClass, SmArch>; + + EXPECT_TRUE(cuasr::test::gemm::device::TestAllGemm()); +} + + +/////////////////////////////////////////////////////////////////////////////// + +TEST(SM50_device_binary_or_binary_and_dsrgemm_nt_n, default) { + using precision = double; + using OpClass = cutlass::arch::OpClassSimt; + using SmArch = cutlass::arch::Sm50; + + using AddOp = cuasr::binary_or; + using MultOp = cuasr::binary_and; + + using Srgemm = cuasr::gemm::device::Srgemm< // + AddOp, MultOp, // + precision, cutlass::layout::ColumnMajor, // + precision, cutlass::layout::RowMajor, // + precision, cutlass::layout::ColumnMajor, + precision, OpClass, SmArch>; + + EXPECT_TRUE(cuasr::test::gemm::device::TestAllGemm()); +} + + +/////////////////////////////////////////////////////////////////////////////// + +TEST(SM50_device_binary_or_binary_and_dsrgemm_nt_t, default) { + using precision = double; + using OpClass = cutlass::arch::OpClassSimt; + using SmArch = cutlass::arch::Sm50; + + using AddOp = cuasr::binary_or; + using 
MultOp = cuasr::binary_and; + + using Srgemm = cuasr::gemm::device::Srgemm< // + AddOp, MultOp, // + precision, cutlass::layout::ColumnMajor, // + precision, cutlass::layout::RowMajor, // + precision, cutlass::layout::RowMajor, + precision, OpClass, SmArch>; + + EXPECT_TRUE(cuasr::test::gemm::device::TestAllGemm()); +} + + +/////////////////////////////////////////////////////////////////////////////// + +TEST(SM50_device_binary_or_binary_and_dsrgemm_nn_n, default) { + using precision = double; + using OpClass = cutlass::arch::OpClassSimt; + using SmArch = cutlass::arch::Sm50; + + using AddOp = cuasr::binary_or; + using MultOp = cuasr::binary_and; + + using Srgemm = cuasr::gemm::device::Srgemm< // + AddOp, MultOp, // + precision, cutlass::layout::ColumnMajor, // + precision, cutlass::layout::ColumnMajor, // + precision, cutlass::layout::ColumnMajor, + precision, OpClass, SmArch>; + + EXPECT_TRUE(cuasr::test::gemm::device::TestAllGemm()); +} + + +/////////////////////////////////////////////////////////////////////////////// + +TEST(SM50_device_binary_or_binary_and_dsrgemm_nn_t, default) { + using precision = double; + using OpClass = cutlass::arch::OpClassSimt; + using SmArch = cutlass::arch::Sm50; + + using AddOp = cuasr::binary_or; + using MultOp = cuasr::binary_and; + + using Srgemm = cuasr::gemm::device::Srgemm< // + AddOp, MultOp, // + precision, cutlass::layout::ColumnMajor, // + precision, cutlass::layout::ColumnMajor, // + precision, cutlass::layout::RowMajor, + precision, OpClass, SmArch>; + + EXPECT_TRUE(cuasr::test::gemm::device::TestAllGemm()); +} + + +/////////////////////////////////////////////////////////////////////////////// + +TEST(SM50_device_binary_or_binary_and_ssrgemm_tt_n, default) { + using precision = float; + using OpClass = cutlass::arch::OpClassSimt; + using SmArch = cutlass::arch::Sm50; + + using AddOp = cuasr::binary_or; + using MultOp = cuasr::binary_and; + + using Srgemm = cuasr::gemm::device::Srgemm< // + AddOp, MultOp, // + 
precision, cutlass::layout::RowMajor, // + precision, cutlass::layout::RowMajor, // + precision, cutlass::layout::ColumnMajor, + precision, OpClass, SmArch>; + + EXPECT_TRUE(cuasr::test::gemm::device::TestAllGemm()); +} + + +/////////////////////////////////////////////////////////////////////////////// + +TEST(SM50_device_binary_or_binary_and_ssrgemm_tt_t, default) { + using precision = float; + using OpClass = cutlass::arch::OpClassSimt; + using SmArch = cutlass::arch::Sm50; + + using AddOp = cuasr::binary_or; + using MultOp = cuasr::binary_and; + + using Srgemm = cuasr::gemm::device::Srgemm< // + AddOp, MultOp, // + precision, cutlass::layout::RowMajor, // + precision, cutlass::layout::RowMajor, // + precision, cutlass::layout::RowMajor, + precision, OpClass, SmArch>; + + EXPECT_TRUE(cuasr::test::gemm::device::TestAllGemm()); +} + + +/////////////////////////////////////////////////////////////////////////////// + +TEST(SM50_device_binary_or_binary_and_ssrgemm_tn_n, default) { + using precision = float; + using OpClass = cutlass::arch::OpClassSimt; + using SmArch = cutlass::arch::Sm50; + + using AddOp = cuasr::binary_or; + using MultOp = cuasr::binary_and; + + using Srgemm = cuasr::gemm::device::Srgemm< // + AddOp, MultOp, // + precision, cutlass::layout::RowMajor, // + precision, cutlass::layout::ColumnMajor, // + precision, cutlass::layout::ColumnMajor, + precision, OpClass, SmArch>; + + EXPECT_TRUE(cuasr::test::gemm::device::TestAllGemm()); +} + + +/////////////////////////////////////////////////////////////////////////////// + +TEST(SM50_device_binary_or_binary_and_ssrgemm_tn_t, default) { + using precision = float; + using OpClass = cutlass::arch::OpClassSimt; + using SmArch = cutlass::arch::Sm50; + + using AddOp = cuasr::binary_or; + using MultOp = cuasr::binary_and; + + using Srgemm = cuasr::gemm::device::Srgemm< // + AddOp, MultOp, // + precision, cutlass::layout::RowMajor, // + precision, cutlass::layout::ColumnMajor, // + precision, 
cutlass::layout::RowMajor, + precision, OpClass, SmArch>; + + EXPECT_TRUE(cuasr::test::gemm::device::TestAllGemm()); +} + + +/////////////////////////////////////////////////////////////////////////////// + +TEST(SM50_device_binary_or_binary_and_ssrgemm_nt_n, default) { + using precision = float; + using OpClass = cutlass::arch::OpClassSimt; + using SmArch = cutlass::arch::Sm50; + + using AddOp = cuasr::binary_or; + using MultOp = cuasr::binary_and; + + using Srgemm = cuasr::gemm::device::Srgemm< // + AddOp, MultOp, // + precision, cutlass::layout::ColumnMajor, // + precision, cutlass::layout::RowMajor, // + precision, cutlass::layout::ColumnMajor, + precision, OpClass, SmArch>; + + EXPECT_TRUE(cuasr::test::gemm::device::TestAllGemm()); +} + + +/////////////////////////////////////////////////////////////////////////////// + +TEST(SM50_device_binary_or_binary_and_ssrgemm_nt_t, default) { + using precision = float; + using OpClass = cutlass::arch::OpClassSimt; + using SmArch = cutlass::arch::Sm50; + + using AddOp = cuasr::binary_or; + using MultOp = cuasr::binary_and; + + using Srgemm = cuasr::gemm::device::Srgemm< // + AddOp, MultOp, // + precision, cutlass::layout::ColumnMajor, // + precision, cutlass::layout::RowMajor, // + precision, cutlass::layout::RowMajor, + precision, OpClass, SmArch>; + + EXPECT_TRUE(cuasr::test::gemm::device::TestAllGemm()); +} + + +/////////////////////////////////////////////////////////////////////////////// + +TEST(SM50_device_binary_or_binary_and_ssrgemm_nn_n, default) { + using precision = float; + using OpClass = cutlass::arch::OpClassSimt; + using SmArch = cutlass::arch::Sm50; + + using AddOp = cuasr::binary_or; + using MultOp = cuasr::binary_and; + + using Srgemm = cuasr::gemm::device::Srgemm< // + AddOp, MultOp, // + precision, cutlass::layout::ColumnMajor, // + precision, cutlass::layout::ColumnMajor, // + precision, cutlass::layout::ColumnMajor, + precision, OpClass, SmArch>; + + 
EXPECT_TRUE(cuasr::test::gemm::device::TestAllGemm()); +} + + +/////////////////////////////////////////////////////////////////////////////// + +TEST(SM50_device_binary_or_binary_and_ssrgemm_nn_t, default) { + using precision = float; + using OpClass = cutlass::arch::OpClassSimt; + using SmArch = cutlass::arch::Sm50; + + using AddOp = cuasr::binary_or; + using MultOp = cuasr::binary_and; + + using Srgemm = cuasr::gemm::device::Srgemm< // + AddOp, MultOp, // + precision, cutlass::layout::ColumnMajor, // + precision, cutlass::layout::ColumnMajor, // + precision, cutlass::layout::RowMajor, + precision, OpClass, SmArch>; + + EXPECT_TRUE(cuasr::test::gemm::device::TestAllGemm()); +} + From e6c89620024652cd5e5859d929525655900d574f Mon Sep 17 00:00:00 2001 From: Void Date: Thu, 23 Dec 2021 12:49:12 -0500 Subject: [PATCH 14/15] remove cuASR CUDA Archs and use CMAKE_CUDA_ARCHITECTURES --- CMakeLists.txt | 6 ++---- README.md | 4 ++-- 2 files changed, 4 insertions(+), 6 deletions(-) diff --git a/CMakeLists.txt b/CMakeLists.txt index 1f03d90..f888c5a 100644 --- a/CMakeLists.txt +++ b/CMakeLists.txt @@ -22,9 +22,6 @@ option(CUASR_TEST "Build cuASR test suite. Use with CUASR_TEST_LEVEL={0|1|2}. option(CUASR_BENCH "Build cuASR benchmark suite." ON) option(CUASR_EXAMPLE "Build cuASR examples." ON) -# By default, build fat binaries. TODO add sm_80 here -option(CUASR_CUDA_ARCHS "List of CUDA architectures to compile for." 
"80") - # CUDA native compiler (nvcc) only supports upto C++14 for now find_package(CUDA REQUIRED) set(CMAKE_CXX_EXTENSIONS OFF) @@ -46,7 +43,7 @@ set(cuASR_CUDA_FLAGS --expt-relaxed-constexpr) set(cuASR_CUDA_FLAGS_DEBUG -G ${cuASR_CUDA_FLAGS}) set(cuASR_CUDA_FLAGS_RELEASE -O3 ${cuASR_CUDA_FLAGS}) set(cuASR_CUDA_FLAGS_RELWITHDEBINFO -G ${cuASR_CUDA_FLAGS}) -set(CMAKE_CUDA_ARCHITECTURES ${CUASR_CUDA_ARCHS}) +set(CMAKE_CUDA_ARCHITECTURES "80") # the sub-modules update themselves with git, so find git find_package(Git QUIET) @@ -99,6 +96,7 @@ message(STATUS " C++ Compiler : ${CMAKE_CXX_COMPILER}") message(STATUS " C++ Compiler version : ${CMAKE_CXX_COMPILER_VERSION}") message(STATUS " CUDA Compiler : ${CMAKE_CUDA_COMPILER}") message(STATUS " CUDA Compiler version: ${CMAKE_CUDA_COMPILER_VERSION}") +message(STATUS " CUDA Arch support : ${CMAKE_CUDA_ARCHITECTURES}") message(STATUS " Build tests : ${CUASR_TEST}") message(STATUS " Test level : ${CUASR_TEST_LEVEL}") message(STATUS " Build benchmarks : ${CUASR_BENCH}") diff --git a/README.md b/README.md index 0fcd465..73b4d0f 100644 --- a/README.md +++ b/README.md @@ -24,7 +24,7 @@ cuASR is a template library and therefore header only, but includes an exhaustiv $ git clone --recurse-submodules https://github.com/hpcgarage/cuASR /path/to/repo $ cd /path/to/repo $ mkdir build && cd build -$ cmake .. -G Ninja -DCUASR_CUDA_ARCHS="70 75" +$ cmake .. -G Ninja -DCMAKE_CUDA_ARCHITECTURES="70 75 80" $ ninja ``` @@ -34,7 +34,7 @@ Notable build flags: | Build Flag | Usage Description | |-|-| -| `CUASR_CUDA_ARCHS` | lists the CUDA SM architectures the fat binaries should be built to target. `CUASR_CUDA_ARCHS="60 61 70 72 75"` (all Pascal and Volta GPUs) will be used if no value is specified, but this can really hurt compile times for tests and benchmarks; Limit CUDA architectures to the smallest subset you forsee running the tests and benchmarks on. 
+| `CMAKE_CUDA_ARCHITECTURES` | lists the CUDA SM architectures the fat binaries should be built to target. `CMAKE_CUDA_ARCHITECTURES="80"` (Ampere) will be used if no value is specified, but this can really hurt compile times for tests and benchmarks; Limit CUDA architectures to the smallest subset you forsee running the tests and benchmarks on. | `CUASR_TEST` | Set to `ON` by default and controls whether tests will be built or not. Set to `OFF` to disable building all tests. | | `CUASR_BENCH` | Set to `ON` by default and controls whether benchmarks will be built or not. Set to `OFF` to disable building all benchmarks. | | `CUASR_EXAMPLES` | Set to `ON` by default and controls whether examples will be built or not. Set to `OFF` to disable building all examples. | From 689edcfb9f6e22856db9eef348dc151a7908ea61 Mon Sep 17 00:00:00 2001 From: Void Date: Fri, 8 Apr 2022 09:46:21 -0400 Subject: [PATCH 15/15] cmake: fix broken option for user defined CUDA arch --- CMakeLists.txt | 4 +++- 1 file changed, 3 insertions(+), 1 deletion(-) diff --git a/CMakeLists.txt b/CMakeLists.txt index f888c5a..009a306 100644 --- a/CMakeLists.txt +++ b/CMakeLists.txt @@ -43,7 +43,9 @@ set(cuASR_CUDA_FLAGS --expt-relaxed-constexpr) set(cuASR_CUDA_FLAGS_DEBUG -G ${cuASR_CUDA_FLAGS}) set(cuASR_CUDA_FLAGS_RELEASE -O3 ${cuASR_CUDA_FLAGS}) set(cuASR_CUDA_FLAGS_RELWITHDEBINFO -G ${cuASR_CUDA_FLAGS}) -set(CMAKE_CUDA_ARCHITECTURES "80") +if (NOT CMAKE_CUDA_ARCHITECTURES) + set(CMAKE_CUDA_ARCHITECTURES "80") +endif() # the sub-modules update themselves with git, so find git find_package(Git QUIET)